CIVL v0.11 of 2014-04-22 -- http://vsl.cis.udel.edu/civl 1 2 speedup ------- Elapsed time in CPU: 1 milliseconds ample processes at state 716: 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 State 716 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p3], 1:=X_s16v1[0][1][0:=p4], 2:=X_s16v1[0][2][0:=p5], 3:=X_s16v1[0][3][0:=p6]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p7], 1:=X_s16v1[1][1][0:=p8], 2:=X_s16v1[1][2][0:=p9], 3:=X_s16v1[1][3][0:=p10]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p11], 1:=X_s16v1[2][1][0:=p12], 2:=X_s16v1[2][2][0:=p13], 3:=X_s16v1[2][3][0:=p14]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p15], 1:=X_s16v1[3][1][0:=p16], 2:=X_s16v1[3][2][0:=p17], 3:=X_s16v1[3][3][0:=p18]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d122 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d121 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d126 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d125 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d130 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d129 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d134 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d133 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d139 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d138 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d143 (id=31, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d142 (id=32, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d147 (id=33, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d146 (id=34, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d151 (id=35, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d150 (id=36, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d156 (id=37, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d155 (id=38, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d160 (id=39, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d159 (id=40, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d164 (id=41, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d163 (id=42, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d168 (id=43, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=44, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=45, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=46, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=47, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=48, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=49, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=50, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=51, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=52, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] | | process p8(id=8) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d143] | | process p9(id=9) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d147] | | process p10(id=10) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d151] | | process p11(id=11) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d156] | | process p12(id=12) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d160] | | process p13(id=13) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d164] | | process p14(id=14) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d168] | | process p15(id=15) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d173] | | process p16(id=16) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d177] | | process p17(id=17) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d181] | | process p18(id=18) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d185] ample processes at state 721: 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 State 721 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=p3], 2:=X_s16v1[0][2][0:=p4], 3:=X_s16v1[0][3][0:=p5]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p6], 1:=X_s16v1[1][1][0:=p7], 2:=X_s16v1[1][2][0:=p8], 3:=X_s16v1[1][3][0:=p9]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p10], 1:=X_s16v1[2][1][0:=p11], 2:=X_s16v1[2][2][0:=p12], 3:=X_s16v1[2][3][0:=p13]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p14], 1:=X_s16v1[3][1][0:=p15], 2:=X_s16v1[3][2][0:=p16], 3:=X_s16v1[3][3][0:=p17]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d126 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d125 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d130 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d129 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d134 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d133 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d139 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d138 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d143 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d142 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d147 (id=31, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d146 (id=32, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d151 (id=33, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d150 (id=34, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d156 (id=35, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d155 (id=36, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d160 (id=37, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d159 (id=38, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d164 (id=39, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d163 (id=40, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d168 (id=41, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=42, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=43, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=44, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=45, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=46, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=47, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=48, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=49, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=50, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] | | process p8(id=8) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d143] | | process p9(id=9) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d147] | | process p10(id=10) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d151] | | process p11(id=11) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d156] | | process p12(id=12) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d160] | | process p13(id=13) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d164] | | process p14(id=14) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d168] | | process p15(id=15) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d173] | | process p16(id=16) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d177] | | process p17(id=17) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d181] ample processes at state 726: 3 4 5 6 7 8 9 10 11 12 13 14 15 16 State 726 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=p3], 3:=X_s16v1[0][3][0:=p4]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p5], 1:=X_s16v1[1][1][0:=p6], 2:=X_s16v1[1][2][0:=p7], 3:=X_s16v1[1][3][0:=p8]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p9], 1:=X_s16v1[2][1][0:=p10], 2:=X_s16v1[2][2][0:=p11], 3:=X_s16v1[2][3][0:=p12]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p13], 1:=X_s16v1[3][1][0:=p14], 2:=X_s16v1[3][2][0:=p15], 3:=X_s16v1[3][3][0:=p16]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d130 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d129 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d134 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d133 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d139 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d138 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d143 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d142 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d147 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d146 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d151 (id=31, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d150 (id=32, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d156 (id=33, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d155 (id=34, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d160 (id=35, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d159 (id=36, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d164 (id=37, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d163 (id=38, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d168 (id=39, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=40, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=41, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=42, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=43, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=44, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=45, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=46, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=47, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=48, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] | | process p8(id=8) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d143] | | process p9(id=9) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d147] | | process p10(id=10) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d151] | | process p11(id=11) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d156] | | process p12(id=12) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d160] | | process p13(id=13) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d164] | | process p14(id=14) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d168] | | process p15(id=15) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d173] | | process p16(id=16) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d177] ample processes at state 731: 3 4 5 6 7 8 9 10 11 12 13 14 15 State 731 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=p3]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p4], 1:=X_s16v1[1][1][0:=p5], 2:=X_s16v1[1][2][0:=p6], 3:=X_s16v1[1][3][0:=p7]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p8], 1:=X_s16v1[2][1][0:=p9], 2:=X_s16v1[2][2][0:=p10], 3:=X_s16v1[2][3][0:=p11]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p12], 1:=X_s16v1[3][1][0:=p13], 2:=X_s16v1[3][2][0:=p14], 3:=X_s16v1[3][3][0:=p15]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d134 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d133 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d139 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d138 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d143 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d142 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d147 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d146 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d151 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d150 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d156 (id=31, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d155 (id=32, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d160 (id=33, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d159 (id=34, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d164 (id=35, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d163 (id=36, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d168 (id=37, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=38, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=39, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=40, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=41, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=42, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=43, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=44, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=45, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=46, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] | | process p8(id=8) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d143] | | process p9(id=9) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d147] | | process p10(id=10) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d151] | | process p11(id=11) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d156] | | process p12(id=12) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d160] | | process p13(id=13) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d164] | | process p14(id=14) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d168] | | process p15(id=15) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d173] ample processes at state 738: 3 4 5 6 7 8 9 10 11 12 13 14 State 738 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 1 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p3], 1:=X_s16v1[1][1][0:=p4], 2:=X_s16v1[1][2][0:=p5], 3:=X_s16v1[1][3][0:=p6]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p7], 1:=X_s16v1[2][1][0:=p8], 2:=X_s16v1[2][2][0:=p9], 3:=X_s16v1[2][3][0:=p10]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p11], 1:=X_s16v1[3][1][0:=p12], 2:=X_s16v1[3][2][0:=p13], 3:=X_s16v1[3][3][0:=p14]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d139 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d138 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d143 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d142 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d147 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d146 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d151 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d150 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d156 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d155 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d160 (id=31, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d159 (id=32, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d164 (id=33, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d163 (id=34, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d168 (id=35, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=36, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=37, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=38, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=39, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=40, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=41, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=42, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=43, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=44, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] | | process p8(id=8) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d143] | | process p9(id=9) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d147] | | process p10(id=10) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d151] | | process p11(id=11) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d156] | | process p12(id=12) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d160] | | process p13(id=13) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d164] | | process p14(id=14) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d168] ample processes at state 743: 3 4 5 6 7 8 9 10 11 12 13 State 743 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 1 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=p3], 2:=X_s16v1[1][2][0:=p4], 3:=X_s16v1[1][3][0:=p5]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p6], 1:=X_s16v1[2][1][0:=p7], 2:=X_s16v1[2][2][0:=p8], 3:=X_s16v1[2][3][0:=p9]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p10], 1:=X_s16v1[3][1][0:=p11], 2:=X_s16v1[3][2][0:=p12], 3:=X_s16v1[3][3][0:=p13]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d143 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d142 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d147 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d146 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d151 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d150 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d156 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d155 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d160 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d159 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d164 (id=31, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d163 (id=32, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d168 (id=33, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=34, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=35, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=36, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=37, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=38, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=39, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=40, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=41, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=42, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] | | process p8(id=8) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d143] | | process p9(id=9) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d147] | | process p10(id=10) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d151] | | process p11(id=11) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d156] | | process p12(id=12) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d160] | | process p13(id=13) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d164] ample processes at state 748: 3 4 5 6 7 8 9 10 11 12 State 748 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 1 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=p3], 3:=X_s16v1[1][3][0:=p4]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p5], 1:=X_s16v1[2][1][0:=p6], 2:=X_s16v1[2][2][0:=p7], 3:=X_s16v1[2][3][0:=p8]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p9], 1:=X_s16v1[3][1][0:=p10], 2:=X_s16v1[3][2][0:=p11], 3:=X_s16v1[3][3][0:=p12]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d147 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d146 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d151 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d150 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d156 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d155 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d160 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d159 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d164 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d163 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d168 (id=31, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=32, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=33, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=34, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=35, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=36, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=37, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=38, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=39, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=40, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] | | process p8(id=8) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d143] | | process p9(id=9) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d147] | | process p10(id=10) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d151] | | process p11(id=11) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d156] | | process p12(id=12) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d160] ample processes at state 753: 3 4 5 6 7 8 9 10 11 State 753 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 1 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=p3]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p4], 1:=X_s16v1[2][1][0:=p5], 2:=X_s16v1[2][2][0:=p6], 3:=X_s16v1[2][3][0:=p7]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p8], 1:=X_s16v1[3][1][0:=p9], 2:=X_s16v1[3][2][0:=p10], 3:=X_s16v1[3][3][0:=p11]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d151 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d150 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d156 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d155 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d160 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d159 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d164 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d163 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d168 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=31, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=32, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=33, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=34, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=35, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=36, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=37, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=38, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] | | process p8(id=8) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d143] | | process p9(id=9) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d147] | | process p10(id=10) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d151] | | process p11(id=11) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d156] ample processes at state 760: 3 4 5 6 7 8 9 10 State 760 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p3], 1:=X_s16v1[2][1][0:=p4], 2:=X_s16v1[2][2][0:=p5], 3:=X_s16v1[2][3][0:=p6]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p7], 1:=X_s16v1[3][1][0:=p8], 2:=X_s16v1[3][2][0:=p9], 3:=X_s16v1[3][3][0:=p10]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d156 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d155 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d160 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d159 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d164 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d163 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d168 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=31, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=32, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=33, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=34, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=35, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=36, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] | | process p8(id=8) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d143] | | process p9(id=9) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d147] | | process p10(id=10) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d151] ample processes at state 765: 3 4 5 6 7 8 9 State 765 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p3], 2:=X_s16v1[2][2][0:=p4], 3:=X_s16v1[2][3][0:=p5]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p6], 1:=X_s16v1[3][1][0:=p7], 2:=X_s16v1[3][2][0:=p8], 3:=X_s16v1[3][3][0:=p9]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d160 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d159 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d164 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d163 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d168 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=31, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=32, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=33, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=34, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] | | process p8(id=8) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d143] | | process p9(id=9) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d147] ample processes at state 770: 3 4 5 6 7 8 State 770 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p3], 3:=X_s16v1[2][3][0:=p4]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p5], 1:=X_s16v1[3][1][0:=p6], 2:=X_s16v1[3][2][0:=p7], 3:=X_s16v1[3][3][0:=p8]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d164 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d163 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d168 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=31, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=32, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] | | process p8(id=8) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d143] ample processes at state 775: 3 4 5 6 7 State 775 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p3]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p4], 1:=X_s16v1[3][1][0:=p5], 2:=X_s16v1[3][2][0:=p6], 3:=X_s16v1[3][3][0:=p7]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d168 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d167 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d173 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=29, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=30, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] | | process p7(id=7) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d139] ample processes at state 782: 3 4 5 6 State 782 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p3], 1:=X_s16v1[3][1][0:=p4], 2:=X_s16v1[3][2][0:=p5], 3:=X_s16v1[3][3][0:=p6]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d173 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d172 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d177 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=27, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=28, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] | | process p6(id=6) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d134] ample processes at state 787: 3 4 5 State 787 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=UNDEFINED], 1:=X_s16v1[3][1][0:=p3], 2:=X_s16v1[3][2][0:=p4], 3:=X_s16v1[3][3][0:=p5]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d177 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d176 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d181 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=25, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=26, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] | | process p5(id=5) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d130] ample processes at state 792: 3 4 State 792 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[2][])],H_p0s6v0i0l1[0:=__struct_2__]>,(_kernelInstanceNode_[2][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>]>,(__struct_3__[1][])heap<1,1>[0],true>]>,(pointer[4][])heap<0,0>[0]],H_p0s4v0i3l2[0:=&heap<0,0>[0]],UNDEFINED>,(__struct_4__[3][])heap<3,2>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,1>[0],1>],UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = X_s1v5 | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<7,0>[0] | | | | G_B = &heap<8,0>[0] | | | | G_C = &heap<9,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = NULL | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = NULL | | | | _anon_8 = NULL | | | | _anon_9 = NULL | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d95 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<9,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,1>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d93 (id=7, parent=d0, static=70) | | | variables | | | | this = &heap<0,1>[0] | | | | e = &heap<4,2>[0] | | dyscope d81 (id=8, parent=d0, static=46) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<7,0>[0] | | | | B = &heap<8,0>[0] | | | | C = &heap<9,0>[0] | | | | width = 4 | | dyscope d114 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d113 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d112 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d105 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p2]]] | | dyscope d104 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d111 (id=14, parent=d0, static=79) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | dyscope d110 (id=15, parent=d0, static=77) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d188 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d187 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d186 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d116 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=UNDEFINED], 1:=X_s16v1[3][1][0:=UNDEFINED], 2:=X_s16v1[3][2][0:=p3], 3:=X_s16v1[3][3][0:=p4]]] | | dyscope d115 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d181 (id=21, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d180 (id=22, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d185 (id=23, parent=d0, static=83) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d184 (id=24, parent=d0, static=80) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d95] | | | | Frame[function=_main, location=231, f0:224.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d114] | | | | Frame[function=_kernel, location=275, f0:69.8-17 "_runProcs", dyscope=d93] | | process p2(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d188] | | | | Frame[function=_block, location=284, f0:66.12-21 "_runProcs", dyscope=d111] | | process p3(id=3) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d122] | | process p4(id=4) | | | call stack | | | | Frame[function=_thread, location=303, f0:63.16-36 "C[row * width + ... ]", dyscope=d126] Elapsed time in GPU (global memory): 1 milliseconds 1 a b ample processes at state 1124: 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1124 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3 | | | | B_shared = X_s14v4 | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d401 (id=24, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d403 (id=27, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=28, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=29, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d405 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d407 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d409 (id=36, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=39, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=40, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=41, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=48, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=49, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=50, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=51, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=52, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=53, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=60, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=61, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=62, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=63, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=64, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=65, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1125: 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1125 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1]] | | | | B_shared = X_s14v4 | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d401 (id=24, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d403 (id=27, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=28, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=29, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d405 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d407 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d409 (id=36, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=39, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=40, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=41, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=48, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=49, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=50, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=51, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=52, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=53, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=60, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=61, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=62, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=63, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=64, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=65, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1127: 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1127 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),1>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d403 (id=28, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d405 (id=31, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=32, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=33, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d407 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d409 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=40, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=41, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=42, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=43, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=44, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=45, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=52, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=53, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=54, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=55, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=56, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=57, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=64, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=65, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=66, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=67, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=68, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=69, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1128: 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1128 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),1>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1], 1:=X_s14v3[1][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d403 (id=28, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d405 (id=31, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=32, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=33, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d407 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d409 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=40, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=41, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=42, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=43, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=44, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=45, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=52, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=53, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=54, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=55, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=56, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=57, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=64, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=65, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=66, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=67, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=68, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=69, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1130: 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1130 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),2>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1], 1:=X_s14v3[1][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1], 1:=X_s14v4[1][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d405 (id=32, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d407 (id=35, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=36, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=37, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d409 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=44, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=45, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=46, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=47, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=48, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=49, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=56, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=57, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=58, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=59, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=60, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=61, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=68, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=69, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=70, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1131: 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1131 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),2>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1], 1:=X_s14v3[1][0:=1], 2:=X_s14v3[2][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1], 1:=X_s14v4[1][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d405 (id=32, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d407 (id=35, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=36, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=37, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d409 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=44, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=45, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=46, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=47, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=48, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=49, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=56, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=57, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=58, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=59, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=60, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=61, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=68, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=69, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=70, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1133: 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1133 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),3>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1], 1:=X_s14v3[1][0:=1], 2:=X_s14v3[2][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1], 1:=X_s14v4[1][0:=1], 2:=X_s14v4[2][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d407 (id=36, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d409 (id=39, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=40, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=41, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=48, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=49, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=50, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=51, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=52, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=53, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=60, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=61, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=62, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=63, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=64, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=65, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1134: 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1134 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),3>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1], 1:=X_s14v3[1][0:=1], 2:=X_s14v3[2][0:=1], 3:=X_s14v3[3][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1], 1:=X_s14v4[1][0:=1], 2:=X_s14v4[2][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d407 (id=36, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d409 (id=39, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=40, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=41, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=48, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=49, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=50, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=51, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=52, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=53, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=60, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=61, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=62, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=63, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=64, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=65, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1136: 8 9 10 11 12 13 14 15 16 17 18 19 State 1136 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),4>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1], 1:=X_s14v3[1][0:=1], 2:=X_s14v3[2][0:=1], 3:=X_s14v3[3][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1], 1:=X_s14v4[1][0:=1], 2:=X_s14v4[2][0:=1], 3:=X_s14v4[3][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d409 (id=40, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=41, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=42, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=43, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=44, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=45, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=52, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=53, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=54, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=55, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=56, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=57, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=64, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=65, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=66, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=67, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=68, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=69, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1137: 8 9 10 11 12 13 14 15 16 17 18 19 State 1137 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),4>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1], 1:=X_s14v3[1][0:=1], 2:=X_s14v3[2][0:=1], 3:=X_s14v3[3][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1], 1:=X_s14v4[1][0:=1], 2:=X_s14v4[2][0:=1], 3:=X_s14v4[3][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d409 (id=40, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=41, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=42, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=43, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=44, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=45, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=52, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=53, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=54, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=55, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=56, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=57, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=64, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=65, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=66, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=67, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=68, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=69, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1139: 9 10 11 12 13 14 15 16 17 18 19 State 1139 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),5>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1], 1:=X_s14v3[1][0:=1], 2:=X_s14v3[2][0:=1], 3:=X_s14v3[3][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1], 1:=X_s14v4[1][0:=1], 2:=X_s14v4[2][0:=1], 3:=X_s14v4[3][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=44, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=45, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=46, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=47, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=48, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=49, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=56, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=57, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=58, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=59, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=60, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=61, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=68, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=69, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=70, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=71, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=72, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=73, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1140: 9 10 11 12 13 14 15 16 17 18 19 State 1140 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),5>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1], 1:=X_s14v3[1][0:=1, 1:=1], 2:=X_s14v3[2][0:=1], 3:=X_s14v3[3][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1], 1:=X_s14v4[1][0:=1], 2:=X_s14v4[2][0:=1], 3:=X_s14v4[3][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d411 (id=44, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=45, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=46, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=47, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=48, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=49, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=56, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=57, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=58, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=59, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=60, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=61, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=68, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=69, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=70, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=71, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=72, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=73, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1142: 10 11 12 13 14 15 16 17 18 19 State 1142 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),6>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1], 1:=X_s14v3[1][0:=1, 1:=1], 2:=X_s14v3[2][0:=1], 3:=X_s14v3[3][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1], 1:=X_s14v4[1][0:=1, 1:=1], 2:=X_s14v4[2][0:=1], 3:=X_s14v4[3][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=48, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=49, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=50, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=51, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=52, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=53, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=60, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=61, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=62, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=63, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=64, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=65, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=72, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=73, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=74, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1143: 10 11 12 13 14 15 16 17 18 19 State 1143 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),6>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1], 1:=X_s14v3[1][0:=1, 1:=1], 2:=X_s14v3[2][0:=1, 1:=1], 3:=X_s14v3[3][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1], 1:=X_s14v4[1][0:=1, 1:=1], 2:=X_s14v4[2][0:=1], 3:=X_s14v4[3][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d413 (id=48, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=49, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=50, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=51, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=52, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=53, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=60, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=61, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=62, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=63, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=64, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=65, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=72, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=73, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=74, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1145: 11 12 13 14 15 16 17 18 19 State 1145 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),7>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1], 1:=X_s14v3[1][0:=1, 1:=1], 2:=X_s14v3[2][0:=1, 1:=1], 3:=X_s14v3[3][0:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1], 1:=X_s14v4[1][0:=1, 1:=1], 2:=X_s14v4[2][0:=1, 1:=1], 3:=X_s14v4[3][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=52, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=53, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=54, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=55, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=56, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=57, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=64, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=65, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=66, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=67, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=68, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=69, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1146: 11 12 13 14 15 16 17 18 19 State 1146 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),7>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1], 1:=X_s14v3[1][0:=1, 1:=1], 2:=X_s14v3[2][0:=1, 1:=1], 3:=X_s14v3[3][0:=1, 1:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1], 1:=X_s14v4[1][0:=1, 1:=1], 2:=X_s14v4[2][0:=1, 1:=1], 3:=X_s14v4[3][0:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d415 (id=52, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=53, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=54, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=55, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=56, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=57, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=64, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=65, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=66, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=67, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=68, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=69, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1148: 12 13 14 15 16 17 18 19 State 1148 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),8>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1], 1:=X_s14v3[1][0:=1, 1:=1], 2:=X_s14v3[2][0:=1, 1:=1], 3:=X_s14v3[3][0:=1, 1:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1], 1:=X_s14v4[1][0:=1, 1:=1], 2:=X_s14v4[2][0:=1, 1:=1], 3:=X_s14v4[3][0:=1, 1:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=56, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=57, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=58, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=59, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=60, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=61, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=68, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=69, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=70, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=71, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=72, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=73, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1149: 12 13 14 15 16 17 18 19 State 1149 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),8>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1], 1:=X_s14v3[1][0:=1, 1:=1], 2:=X_s14v3[2][0:=1, 1:=1], 3:=X_s14v3[3][0:=1, 1:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1], 1:=X_s14v4[1][0:=1, 1:=1], 2:=X_s14v4[2][0:=1, 1:=1], 3:=X_s14v4[3][0:=1, 1:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d417 (id=56, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=57, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=58, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=59, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=60, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=61, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=68, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=69, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=70, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=71, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=72, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=73, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1151: 13 14 15 16 17 18 19 State 1151 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),9>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1], 1:=X_s14v3[1][0:=1, 1:=1], 2:=X_s14v3[2][0:=1, 1:=1], 3:=X_s14v3[3][0:=1, 1:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1], 1:=X_s14v4[1][0:=1, 1:=1], 2:=X_s14v4[2][0:=1, 1:=1], 3:=X_s14v4[3][0:=1, 1:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=60, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=61, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=62, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=63, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=64, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=65, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=72, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=73, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=74, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=75, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=76, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=77, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1152: 13 14 15 16 17 18 19 State 1152 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),9>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1], 2:=X_s14v3[2][0:=1, 1:=1], 3:=X_s14v3[3][0:=1, 1:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1], 1:=X_s14v4[1][0:=1, 1:=1], 2:=X_s14v4[2][0:=1, 1:=1], 3:=X_s14v4[3][0:=1, 1:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d419 (id=60, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=61, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=62, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=63, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=64, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=65, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=72, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=73, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=74, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=75, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=76, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=77, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1154: 14 15 16 17 18 19 State 1154 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),10>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1], 2:=X_s14v3[2][0:=1, 1:=1], 3:=X_s14v3[3][0:=1, 1:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1], 2:=X_s14v4[2][0:=1, 1:=1], 3:=X_s14v4[3][0:=1, 1:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=64, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=65, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=66, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=67, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=68, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=69, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=76, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=77, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=78, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1155: 14 15 16 17 18 19 State 1155 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),10>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1], 3:=X_s14v3[3][0:=1, 1:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1], 2:=X_s14v4[2][0:=1, 1:=1], 3:=X_s14v4[3][0:=1, 1:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d421 (id=64, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=65, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=66, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=67, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=68, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=69, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=76, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=77, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=78, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1157: 15 16 17 18 19 State 1157 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),11>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1], 3:=X_s14v3[3][0:=1, 1:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1], 3:=X_s14v4[3][0:=1, 1:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=68, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=69, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=70, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=71, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=72, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=73, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=77, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=78, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=79, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1158: 15 16 17 18 19 State 1158 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),11>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1], 3:=X_s14v4[3][0:=1, 1:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d423 (id=68, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=69, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=70, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=71, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=72, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=73, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=77, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=78, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=79, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1160: 16 17 18 19 State 1160 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),12>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=72, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=73, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=74, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=75, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=76, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=77, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1161: 16 17 18 19 State 1161 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),12>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d425 (id=72, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=73, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=74, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=75, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=76, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=77, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1163: 17 18 19 State 1163 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),13>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d425 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=76, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=77, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=78, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=79, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=80, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=81, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1164: 17 18 19 State 1164 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),13>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d425 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d427 (id=76, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=77, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=78, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=79, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=80, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=81, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1166: 18 19 State 1166 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),14>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d425 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d443 (id=76, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d427 (id=77, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=78, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=79, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=80, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=81, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=82, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d443] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1167: 18 19 State 1167 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),14>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d425 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d443 (id=76, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d427 (id=77, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=78, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=79, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d429 (id=80, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=81, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=82, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d443] | | | | Frame[function=_thread, location=319, f0:112.20-33 "$barrier_call", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=318, f0:110.20-36 "B_shared[ty][tx]", dyscope=d427] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=317, f0:108.20-36 "A_shared[ty][tx]", dyscope=d429] ample processes at state 1203: 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1203 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d447 (id=21, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d399 (id=22, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 0 | | dyscope d330 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d448 (id=25, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d401 (id=26, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d447] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d448] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1205: 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1205 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d447 (id=21, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d399 (id=22, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 1 | | dyscope d330 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d448 (id=25, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d401 (id=26, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d447] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d448] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1207: 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1207 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d447 (id=21, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d399 (id=22, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 2 | | dyscope d330 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d448 (id=25, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d401 (id=26, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d447] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d448] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1209: 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1209 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d447 (id=21, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d399 (id=22, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 3 | | dyscope d330 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d448 (id=25, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d401 (id=26, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d447] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d448] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1212: 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1212 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),1>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d448 (id=25, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d401 (id=26, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 0 | | dyscope d334 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d448] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1214: 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1214 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),1>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d448 (id=25, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d401 (id=26, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 1 | | dyscope d334 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d448] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1216: 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1216 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),1>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d448 (id=25, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d401 (id=26, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 2 | | dyscope d334 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d448] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1218: 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1218 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),1>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d448 (id=25, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d401 (id=26, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 3 | | dyscope d334 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d448] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1221: 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1221 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),2>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 0 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1223: 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1223 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),2>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 1 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1225: 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1225 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),2>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 2 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1227: 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1227 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),2>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d449 (id=29, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d403 (id=30, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 3 | | dyscope d338 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d449] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1230: 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1230 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),3>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 0 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1232: 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1232 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),3>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 1 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1234: 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1234 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),3>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 2 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1236: 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1236 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),3>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d450 (id=33, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d405 (id=34, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 3 | | dyscope d342 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d450] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1239: 8 9 10 11 12 13 14 15 16 17 18 19 State 1239 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),4>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 0 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1241: 8 9 10 11 12 13 14 15 16 17 18 19 State 1241 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),4>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 1 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1243: 8 9 10 11 12 13 14 15 16 17 18 19 State 1243 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),4>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 2 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1245: 8 9 10 11 12 13 14 15 16 17 18 19 State 1245 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),4>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d451 (id=37, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d407 (id=38, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 3 | | dyscope d347 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d451] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1248: 9 10 11 12 13 14 15 16 17 18 19 State 1248 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),5>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 0 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1250: 9 10 11 12 13 14 15 16 17 18 19 State 1250 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),5>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 1 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1252: 9 10 11 12 13 14 15 16 17 18 19 State 1252 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),5>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 2 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1254: 9 10 11 12 13 14 15 16 17 18 19 State 1254 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),5>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d452 (id=41, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d409 (id=42, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 3 | | dyscope d351 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d452] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1257: 10 11 12 13 14 15 16 17 18 19 State 1257 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),6>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 0 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1259: 10 11 12 13 14 15 16 17 18 19 State 1259 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),6>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 1 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1261: 10 11 12 13 14 15 16 17 18 19 State 1261 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),6>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 2 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1263: 10 11 12 13 14 15 16 17 18 19 State 1263 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),6>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d453 (id=45, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d411 (id=46, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 3 | | dyscope d355 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d453] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1266: 11 12 13 14 15 16 17 18 19 State 1266 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),7>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 0 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1268: 11 12 13 14 15 16 17 18 19 State 1268 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),7>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 1 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1270: 11 12 13 14 15 16 17 18 19 State 1270 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),7>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 2 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1272: 11 12 13 14 15 16 17 18 19 State 1272 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),7>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d454 (id=49, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d413 (id=50, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 3 | | dyscope d359 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d454] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1275: 12 13 14 15 16 17 18 19 State 1275 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),8>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 0 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1277: 12 13 14 15 16 17 18 19 State 1277 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),8>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 1 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1279: 12 13 14 15 16 17 18 19 State 1279 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),8>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 2 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1281: 12 13 14 15 16 17 18 19 State 1281 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),8>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d455 (id=53, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d415 (id=54, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=55, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 3 | | dyscope d364 (id=56, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d455] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1284: 13 14 15 16 17 18 19 State 1284 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),9>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 0 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1286: 13 14 15 16 17 18 19 State 1286 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),9>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 1 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1288: 13 14 15 16 17 18 19 State 1288 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),9>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 2 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1290: 13 14 15 16 17 18 19 State 1290 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),9>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d456 (id=57, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d417 (id=58, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=59, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 3 | | dyscope d368 (id=60, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d456] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1293: 14 15 16 17 18 19 State 1293 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),10>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 0 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1295: 14 15 16 17 18 19 State 1295 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),10>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 1 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1297: 14 15 16 17 18 19 State 1297 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),10>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 2 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1299: 14 15 16 17 18 19 State 1299 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),10>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d457 (id=61, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d419 (id=62, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=63, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 3 | | dyscope d372 (id=64, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d457] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1302: 15 16 17 18 19 State 1302 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),11>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 0 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1304: 15 16 17 18 19 State 1304 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),11>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 1 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1306: 15 16 17 18 19 State 1306 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),11>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 2 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1308: 15 16 17 18 19 State 1308 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),11>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d458 (id=65, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d421 (id=66, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=67, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 3 | | dyscope d376 (id=68, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d458] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1311: 16 17 18 19 State 1311 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),12>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 0 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1313: 16 17 18 19 State 1313 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),12>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 1 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1315: 16 17 18 19 State 1315 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),12>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 2 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1317: 16 17 18 19 State 1317 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),12>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d459 (id=69, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d423 (id=70, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=71, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 3 | | dyscope d381 (id=72, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d459] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1320: 17 18 19 State 1320 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),13>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 0 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1322: 17 18 19 State 1322 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),13>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 1 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1324: 17 18 19 State 1324 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),13>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 2 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1326: 17 18 19 State 1326 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),13>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d460 (id=73, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d425 (id=74, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=75, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 3 | | dyscope d385 (id=76, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d460] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1329: 18 19 State 1329 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),14>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d425 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d443 (id=76, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 0 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d443] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1331: 18 19 State 1331 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),14>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d425 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d443 (id=76, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 1 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 1 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d443] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1333: 18 19 State 1333 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),14>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d425 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d443 (id=76, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 2 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 2 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d443] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1335: 18 19 State 1335 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),14>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d399 (id=21, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d331 (id=22, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=23, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d430 (id=24, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d401 (id=25, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d335 (id=26, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=27, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d431 (id=28, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d403 (id=29, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d339 (id=30, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=31, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d432 (id=32, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d405 (id=33, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d343 (id=34, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=35, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d433 (id=36, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d407 (id=37, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d348 (id=38, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=39, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d434 (id=40, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d409 (id=41, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d352 (id=42, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=43, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d435 (id=44, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d411 (id=45, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d356 (id=46, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=47, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d436 (id=48, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d413 (id=49, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d360 (id=50, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=51, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d437 (id=52, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d415 (id=53, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d365 (id=54, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=55, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d438 (id=56, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d417 (id=57, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d369 (id=58, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=59, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d439 (id=60, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d419 (id=61, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d373 (id=62, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=63, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d440 (id=64, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d421 (id=65, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d377 (id=66, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=67, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d441 (id=68, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d423 (id=69, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d382 (id=70, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=71, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d442 (id=72, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d425 (id=73, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d386 (id=74, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=75, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d443 (id=76, parent=d0, static=13) | | | variables | | | | barrier = &heap<14,0>[0] | | dyscope d461 (id=77, parent=d0, static=87) | | | variables | | | | k = 3 | | dyscope d427 (id=78, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d390 (id=79, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 3 | | dyscope d389 (id=80, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d446 (id=81, parent=d0, static=87) | | | variables | | | | k = 0 | | dyscope d429 (id=82, parent=d0, static=86) | | | variables | | | | phase = 0 | | dyscope d394 (id=83, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 0 | | dyscope d393 (id=84, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d430] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d399] | | process p22(id=5) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d431] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d401] | | process p23(id=6) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d432] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d403] | | process p24(id=7) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d433] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d405] | | process p25(id=8) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d434] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d407] | | process p26(id=9) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d435] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d409] | | process p27(id=10) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d436] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d411] | | process p28(id=11) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d437] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d413] | | process p29(id=12) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d438] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d415] | | process p30(id=13) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d439] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d417] | | process p31(id=14) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d440] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d419] | | process p32(id=15) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d441] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d421] | | process p33(id=16) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d442] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d423] | | process p34(id=17) | | | call stack | | | | Frame[function=$barrier_call, location=17, f1:133.2-15 "$barrier_exit", dyscope=d443] | | | | Frame[function=_thread, location=324, f0:118.20-33 "$barrier_call", dyscope=d425] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d461] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=322, f0:115.24-30 "result", dyscope=d446] ample processes at state 1378: 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 State 1378 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=p21], 1:=X_s16v1[0][1][0:=p22], 2:=X_s16v1[0][2][0:=p23], 3:=X_s16v1[0][3][0:=p24]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p25], 1:=X_s16v1[1][1][0:=p26], 2:=X_s16v1[1][2][0:=p27], 3:=X_s16v1[1][3][0:=p28]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p29], 1:=X_s16v1[2][1][0:=p30], 2:=X_s16v1[2][2][0:=p31], 3:=X_s16v1[2][3][0:=p32]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p33], 1:=X_s16v1[3][1][0:=p34], 2:=X_s16v1[3][2][0:=p35], 3:=X_s16v1[3][3][0:=p36]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d331 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<0,&heap<13,0>[0]>>>> | | | | _tid = 0 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 0 | | | | row = 0 | | | | col = 0 | | | | result = 4 | | dyscope d330 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,0,0> | | dyscope d335 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d339 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d343 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d348 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d352 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d356 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d360 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d365 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d369 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=41, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=42, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=45, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=46, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=49, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=50, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=51, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=52, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d365] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d369] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d373] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d377] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d382] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d386] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d390] | | process p36(id=19) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d394] ample processes at state 1383: 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 State 1383 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=p21], 2:=X_s16v1[0][2][0:=p22], 3:=X_s16v1[0][3][0:=p23]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p24], 1:=X_s16v1[1][1][0:=p25], 2:=X_s16v1[1][2][0:=p26], 3:=X_s16v1[1][3][0:=p27]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p28], 1:=X_s16v1[2][1][0:=p29], 2:=X_s16v1[2][2][0:=p30], 3:=X_s16v1[2][3][0:=p31]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p32], 1:=X_s16v1[3][1][0:=p33], 2:=X_s16v1[3][2][0:=p34], 3:=X_s16v1[3][3][0:=p35]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d335 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<4,&heap<13,0>[0]>>>> | | | | _tid = 4 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 1 | | | | row = 1 | | | | col = 0 | | | | result = 4 | | dyscope d334 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,1,0> | | dyscope d339 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d343 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d348 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d352 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d356 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d360 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d365 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d369 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=41, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=42, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=45, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=46, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=49, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=50, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d365] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d369] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d373] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d377] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d382] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d386] | | process p35(id=18) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d390] ample processes at state 1388: 4 5 6 7 8 9 10 11 12 13 14 15 16 17 State 1388 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=p21], 3:=X_s16v1[0][3][0:=p22]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p23], 1:=X_s16v1[1][1][0:=p24], 2:=X_s16v1[1][2][0:=p25], 3:=X_s16v1[1][3][0:=p26]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p27], 1:=X_s16v1[2][1][0:=p28], 2:=X_s16v1[2][2][0:=p29], 3:=X_s16v1[2][3][0:=p30]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p31], 1:=X_s16v1[3][1][0:=p32], 2:=X_s16v1[3][2][0:=p33], 3:=X_s16v1[3][3][0:=p34]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d339 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<8,&heap<13,0>[0]>>>> | | | | _tid = 8 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 2 | | | | row = 2 | | | | col = 0 | | | | result = 4 | | dyscope d338 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,2,0> | | dyscope d343 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d348 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d352 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d356 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d360 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d365 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d369 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=41, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=42, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=45, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=46, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=47, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=48, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d365] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d369] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d373] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d377] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d382] | | process p34(id=17) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d386] ample processes at state 1393: 4 5 6 7 8 9 10 11 12 13 14 15 16 State 1393 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=p21]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p22], 1:=X_s16v1[1][1][0:=p23], 2:=X_s16v1[1][2][0:=p24], 3:=X_s16v1[1][3][0:=p25]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p26], 1:=X_s16v1[2][1][0:=p27], 2:=X_s16v1[2][2][0:=p28], 3:=X_s16v1[2][3][0:=p29]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p30], 1:=X_s16v1[3][1][0:=p31], 2:=X_s16v1[3][2][0:=p32], 3:=X_s16v1[3][3][0:=p33]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d343 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<12,&heap<13,0>[0]>>>> | | | | _tid = 12 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 0 | | | | ty = 3 | | | | row = 3 | | | | col = 0 | | | | result = 4 | | dyscope d342 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<0,3,0> | | dyscope d348 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d352 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d356 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d360 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d365 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d369 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=41, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=42, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=45, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=46, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d365] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d369] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d373] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d377] | | process p33(id=16) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d382] ample processes at state 1400: 4 5 6 7 8 9 10 11 12 13 14 15 State 1400 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 1 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=p21], 1:=X_s16v1[1][1][0:=p22], 2:=X_s16v1[1][2][0:=p23], 3:=X_s16v1[1][3][0:=p24]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p25], 1:=X_s16v1[2][1][0:=p26], 2:=X_s16v1[2][2][0:=p27], 3:=X_s16v1[2][3][0:=p28]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p29], 1:=X_s16v1[3][1][0:=p30], 2:=X_s16v1[3][2][0:=p31], 3:=X_s16v1[3][3][0:=p32]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d348 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<1,&heap<13,0>[0]>>>> | | | | _tid = 1 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 0 | | | | row = 0 | | | | col = 1 | | | | result = 4 | | dyscope d347 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,0,0> | | dyscope d352 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d356 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d360 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d365 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d369 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=41, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=42, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=43, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=44, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d365] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d369] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d373] | | process p32(id=15) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d377] ample processes at state 1405: 4 5 6 7 8 9 10 11 12 13 14 State 1405 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 1 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=p21], 2:=X_s16v1[1][2][0:=p22], 3:=X_s16v1[1][3][0:=p23]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p24], 1:=X_s16v1[2][1][0:=p25], 2:=X_s16v1[2][2][0:=p26], 3:=X_s16v1[2][3][0:=p27]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p28], 1:=X_s16v1[3][1][0:=p29], 2:=X_s16v1[3][2][0:=p30], 3:=X_s16v1[3][3][0:=p31]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d352 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<5,&heap<13,0>[0]>>>> | | | | _tid = 5 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 1 | | | | row = 1 | | | | col = 1 | | | | result = 4 | | dyscope d351 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,1,0> | | dyscope d356 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d360 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d365 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d369 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=41, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=42, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d365] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d369] | | process p31(id=14) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d373] ample processes at state 1410: 4 5 6 7 8 9 10 11 12 13 State 1410 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 1 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=p21], 3:=X_s16v1[1][3][0:=p22]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p23], 1:=X_s16v1[2][1][0:=p24], 2:=X_s16v1[2][2][0:=p25], 3:=X_s16v1[2][3][0:=p26]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p27], 1:=X_s16v1[3][1][0:=p28], 2:=X_s16v1[3][2][0:=p29], 3:=X_s16v1[3][3][0:=p30]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d356 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<9,&heap<13,0>[0]>>>> | | | | _tid = 9 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 2 | | | | row = 2 | | | | col = 1 | | | | result = 4 | | dyscope d355 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,2,0> | | dyscope d360 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d365 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d369 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=39, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=40, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d365] | | process p30(id=13) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d369] ample processes at state 1415: 4 5 6 7 8 9 10 11 12 State 1415 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 1 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=p21]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p22], 1:=X_s16v1[2][1][0:=p23], 2:=X_s16v1[2][2][0:=p24], 3:=X_s16v1[2][3][0:=p25]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p26], 1:=X_s16v1[3][1][0:=p27], 2:=X_s16v1[3][2][0:=p28], 3:=X_s16v1[3][3][0:=p29]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d360 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<13,&heap<13,0>[0]>>>> | | | | _tid = 13 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 1 | | | | ty = 3 | | | | row = 3 | | | | col = 1 | | | | result = 4 | | dyscope d359 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<1,3,0> | | dyscope d365 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d369 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=37, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=38, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] | | process p29(id=12) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d365] ample processes at state 1422: 4 5 6 7 8 9 10 11 State 1422 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d369 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=35, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=36, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 1427: 4 5 6 7 8 9 10 State 1427 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 1432: 4 5 6 7 8 9 State 1432 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1437: 4 5 6 7 8 State 1437 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] ample processes at state 1444: 4 5 6 7 State 1444 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p21], 1:=X_s16v1[3][1][0:=p22], 2:=X_s16v1[3][2][0:=p23], 3:=X_s16v1[3][3][0:=p24]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d382 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] ample processes at state 1449: 4 5 6 State 1449 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=UNDEFINED], 1:=X_s16v1[3][1][0:=p21], 2:=X_s16v1[3][2][0:=p22], 3:=X_s16v1[3][3][0:=p23]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d386 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] ample processes at state 1454: 4 5 State 1454 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=UNDEFINED], 1:=X_s16v1[3][1][0:=UNDEFINED], 2:=X_s16v1[3][2][0:=p21], 3:=X_s16v1[3][3][0:=p22]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d390 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] Elapsed time in GPU (shared memory): 1 milliseconds 1 i = 0 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 1 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 2 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 3 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 4 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 5 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 6 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 7 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 8 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 9 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 10 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 11 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 12 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 13 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 14 cpu = 4, gpuGlobal = 4, gpuShared = 4 i = 15 cpu = 4, gpuGlobal = 4, gpuShared = 4 3 4 ample processes at state 1634: 4 6 State 1634 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=UNDEFINED], 1:=X_s16v1[3][1][0:=p21], 2:=X_s16v1[3][2][0:=p22], 3:=X_s16v1[3][3][0:=p23]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d386 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] ample processes at state 1644: 4 5 State 1644 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=UNDEFINED], 1:=X_s16v1[3][1][0:=p21], 2:=X_s16v1[3][2][0:=p22], 3:=X_s16v1[3][3][0:=p23]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d386 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack ample processes at state 1649: 4 6 7 State 1649 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p21], 1:=X_s16v1[3][1][0:=p22], 2:=X_s16v1[3][2][0:=p23], 3:=X_s16v1[3][3][0:=p24]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d382 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] ample processes at state 1654: 4 7 State 1654 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p21], 1:=X_s16v1[3][1][0:=p22], 2:=X_s16v1[3][2][0:=p23], 3:=X_s16v1[3][3][0:=p24]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d382 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d394 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] ample processes at state 1664: 4 6 State 1664 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p21], 1:=X_s16v1[3][1][0:=p22], 2:=X_s16v1[3][2][0:=p23], 3:=X_s16v1[3][3][0:=p24]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d382 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack ample processes at state 1669: 4 5 7 State 1669 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p21], 1:=X_s16v1[3][1][0:=p22], 2:=X_s16v1[3][2][0:=p23], 3:=X_s16v1[3][3][0:=p24]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d382 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] ample processes at state 1674: 4 5 State 1674 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p21], 1:=X_s16v1[3][1][0:=p22], 2:=X_s16v1[3][2][0:=p23], 3:=X_s16v1[3][3][0:=p24]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d382 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack ample processes at state 1679: 4 5 6 State 1679 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 3 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=UNDEFINED]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p21], 1:=X_s16v1[3][1][0:=p22], 2:=X_s16v1[3][2][0:=p23], 3:=X_s16v1[3][3][0:=p24]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d382 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack ample processes at state 1684: 4 6 7 8 State 1684 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] ample processes at state 1691: 4 7 8 State 1691 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] ample processes at state 1698: 4 8 State 1698 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d394 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] ample processes at state 1712: 4 7 State 1712 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack ample processes at state 1719: 4 6 8 State 1719 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] ample processes at state 1726: 4 6 State 1726 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack ample processes at state 1733: 4 6 7 State 1733 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack ample processes at state 1740: 4 5 7 8 State 1740 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] ample processes at state 1747: 4 5 8 State 1747 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] ample processes at state 1754: 4 5 State 1754 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack ample processes at state 1761: 4 5 7 State 1761 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack ample processes at state 1768: 4 5 6 8 State 1768 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] ample processes at state 1775: 4 5 6 State 1775 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack ample processes at state 1782: 4 5 6 7 State 1782 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 3 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=UNDEFINED], 3:=X_s16v1[2][3][0:=p21]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p22], 1:=X_s16v1[3][1][0:=p23], 2:=X_s16v1[3][2][0:=p24], 3:=X_s16v1[3][3][0:=p25]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d377 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack ample processes at state 1789: 4 6 7 8 9 State 1789 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1794: 4 7 8 9 State 1794 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1799: 4 8 9 State 1799 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1804: 4 9 State 1804 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d394 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1814: 4 8 State 1814 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack ample processes at state 1819: 4 7 9 State 1819 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1824: 4 7 State 1824 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack ample processes at state 1829: 4 7 8 State 1829 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack ample processes at state 1834: 4 6 8 9 State 1834 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1839: 4 6 9 State 1839 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1844: 4 6 State 1844 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack ample processes at state 1849: 4 6 8 State 1849 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack ample processes at state 1854: 4 6 7 9 State 1854 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1859: 4 6 7 State 1859 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack ample processes at state 1864: 4 6 7 8 State 1864 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack ample processes at state 1869: 4 5 7 8 9 State 1869 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1874: 4 5 8 9 State 1874 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1879: 4 5 9 State 1879 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1884: 4 5 State 1884 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack ample processes at state 1889: 4 5 8 State 1889 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack ample processes at state 1894: 4 5 7 9 State 1894 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1899: 4 5 7 State 1899 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack ample processes at state 1904: 4 5 7 8 State 1904 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack ample processes at state 1909: 4 5 6 8 9 State 1909 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1914: 4 5 6 9 State 1914 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1919: 4 5 6 State 1919 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack ample processes at state 1924: 4 5 6 8 State 1924 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack ample processes at state 1929: 4 5 6 7 9 State 1929 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] ample processes at state 1934: 4 5 6 7 State 1934 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack ample processes at state 1939: 4 5 6 7 8 State 1939 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 2 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=UNDEFINED], 2:=X_s16v1[2][2][0:=p21], 3:=X_s16v1[2][3][0:=p22]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p23], 1:=X_s16v1[3][1][0:=p24], 2:=X_s16v1[3][2][0:=p25], 3:=X_s16v1[3][3][0:=p26]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d373 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack ample processes at state 1944: 4 6 7 8 9 10 State 1944 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 1949: 4 7 8 9 10 State 1949 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 1954: 4 8 9 10 State 1954 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 1959: 4 9 10 State 1959 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 1964: 4 10 State 1964 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d394 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 1974: 4 9 State 1974 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 1979: 4 8 10 State 1979 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 1984: 4 8 State 1984 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 1989: 4 8 9 State 1989 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 1994: 4 7 9 10 State 1994 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 1999: 4 7 10 State 1999 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2004: 4 7 State 2004 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2009: 4 7 9 State 2009 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2014: 4 7 8 10 State 2014 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2019: 4 7 8 State 2019 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2024: 4 7 8 9 State 2024 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2029: 4 6 8 9 10 State 2029 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2034: 4 6 9 10 State 2034 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2039: 4 6 10 State 2039 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2044: 4 6 State 2044 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2049: 4 6 9 State 2049 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2054: 4 6 8 10 State 2054 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2059: 4 6 8 State 2059 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2064: 4 6 8 9 State 2064 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2069: 4 6 7 9 10 State 2069 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2074: 4 6 7 10 State 2074 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2079: 4 6 7 State 2079 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2084: 4 6 7 9 State 2084 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2089: 4 6 7 8 10 State 2089 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2094: 4 6 7 8 State 2094 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2099: 4 6 7 8 9 State 2099 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2104: 4 5 7 8 9 10 State 2104 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2109: 4 5 8 9 10 State 2109 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2114: 4 5 9 10 State 2114 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2119: 4 5 10 State 2119 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2124: 4 5 State 2124 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2129: 4 5 9 State 2129 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2134: 4 5 8 10 State 2134 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2139: 4 5 8 State 2139 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2144: 4 5 8 9 State 2144 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2149: 4 5 7 9 10 State 2149 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2154: 4 5 7 10 State 2154 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2159: 4 5 7 State 2159 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2164: 4 5 7 9 State 2164 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2169: 4 5 7 8 10 State 2169 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2174: 4 5 7 8 State 2174 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2179: 4 5 7 8 9 State 2179 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2184: 4 5 6 8 9 10 State 2184 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2189: 4 5 6 9 10 State 2189 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2194: 4 5 6 10 State 2194 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2199: 4 5 6 State 2199 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2204: 4 5 6 9 State 2204 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2209: 4 5 6 8 10 State 2209 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2214: 4 5 6 8 State 2214 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2219: 4 5 6 8 9 State 2219 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2224: 4 5 6 7 9 10 State 2224 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2229: 4 5 6 7 10 State 2229 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2234: 4 5 6 7 State 2234 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2239: 4 5 6 7 9 State 2239 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2244: 4 5 6 7 8 10 State 2244 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] ample processes at state 2249: 4 5 6 7 8 State 2249 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack ample processes at state 2254: 4 5 6 7 8 9 State 2254 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 1 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=UNDEFINED], 1:=X_s16v1[2][1][0:=p21], 2:=X_s16v1[2][2][0:=p22], 3:=X_s16v1[2][3][0:=p23]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p24], 1:=X_s16v1[3][1][0:=p25], 2:=X_s16v1[3][2][0:=p26], 3:=X_s16v1[3][3][0:=p27]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d369 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<6,&heap<13,0>[0]>>>> | | | | _tid = 6 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 1 | | | | row = 1 | | | | col = 2 | | | | result = 4 | | dyscope d368 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,1,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d335] | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack ample processes at state 2259: 4 6 7 8 9 10 11 State 2259 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d373 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<10,&heap<13,0>[0]>>>> | | | | _tid = 10 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 2 | | | | row = 2 | | | | col = 2 | | | | result = 4 | | dyscope d372 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,2,0> | | dyscope d377 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=33, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=34, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d339] | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2264: 4 7 8 9 10 11 State 2264 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d382 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=31, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=32, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2269: 4 8 9 10 11 State 2269 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2274: 4 9 10 11 State 2274 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2279: 4 10 11 State 2279 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2284: 4 11 State 2284 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d394 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2294: 4 10 State 2294 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d390 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack ample processes at state 2299: 4 9 11 State 2299 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2304: 4 9 State 2304 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | process p28(id=11) | | | call stack ample processes at state 2309: 4 9 10 State 2309 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d386 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack ample processes at state 2314: 4 8 10 11 State 2314 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2319: 4 8 11 State 2319 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2324: 4 8 State 2324 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | process p28(id=11) | | | call stack ample processes at state 2329: 4 8 10 State 2329 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack ample processes at state 2334: 4 8 9 11 State 2334 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2339: 4 8 9 State 2339 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | process p28(id=11) | | | call stack ample processes at state 2344: 4 8 9 10 State 2344 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d382 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<3,&heap<13,0>[0]>>>> | | | | _tid = 3 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 0 | | | | row = 0 | | | | col = 3 | | | | result = 4 | | dyscope d381 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,0,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | process p25(id=8) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d348] | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack ample processes at state 2349: 4 7 9 10 11 State 2349 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=29, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=30, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2354: 4 7 10 11 State 2354 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2359: 4 7 11 State 2359 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d394 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2364: 4 7 State 2364 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | process p28(id=11) | | | call stack ample processes at state 2369: 4 7 10 State 2369 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d390 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack ample processes at state 2374: 4 7 9 11 State 2374 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d394 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<15,&heap<13,0>[0]>>>> | | | | _tid = 15 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 3 | | | | row = 3 | | | | col = 3 | | | | result = 4 | | dyscope d393 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,3,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | process p28(id=11) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d360] ample processes at state 2379: 4 7 9 State 2379 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | process p28(id=11) | | | call stack ample processes at state 2384: 4 7 9 10 State 2384 | Path condition | | (0 <= SIZEOF_REAL+-1) && (0 <= SIZEOF(dynamicType<226>)+-1) && (0 <= SIZEOF(dynamicType<241>)+-1) && (0 <= SIZEOF(dynamicType<79>)+-1) && (0 <= SIZEOF(dynamicType<230>)+-1) && (0 <= SIZEOF(dynamicType<221>)+-1) | Dynamic scopes | | dyscope d0 (id=0, parent=d0, static=0) | | | variables | | | | __heap = $heap<(__struct_2__[3][])],H_p0s6v0i0l1[0:=__struct_2__],H_p0s6v0i0l2[0:=__struct_2__]>,(_kernelInstanceNode_[3][])heap<0,0>[0],NULL>],H_p0s6v0i1l1[0:=_kernelInstanceNode_<&heap<0,1>[0],&heap<1,0>[0]>],H_p0s6v0i1l2[0:=_kernelInstanceNode_<&heap<0,2>[0],&heap<1,1>[0]>]>,(__struct_3__[1][])heap<1,2>[0],true>]>,(pointer[7][])heap<0,1>[0]],H_p0s4v0i3l5[0:=&heap<0,1>[0]],UNDEFINED>,(__struct_4__[4][])heap<3,5>[0],1>],H_p0s4v0i4l1[0:=__struct_4__<&heap<3,4>[0],1>],UNDEFINED,UNDEFINED>,(pointer[0][])>,(pointer[0][])>,(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(real[1][]),(__gbarrier__[0][])>,(__barrier__[0][])>> | | | | __argc = X_s0v2 | | | | _context = __struct_5__heap<2,0>[0],0> | | | | N = 4 | | | | TILE_WIDTH = 4 | | | | _anon_0 = "1\n" | | | | _anon_1 = "2\n" | | | | _anon_2 = NULL | | | | _anon_3 = NULL | | dyscope d9 (id=1, parent=d0, static=72) | | | variables | | | | A = X_s1v1[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | B = X_s1v2[0:=1, 1:=1, 2:=1, 3:=1, 4:=1, 5:=1, 6:=1, 7:=1, 8:=1, 9:=1, 10:=1, 11:=1, 12:=1, 13:=1, 14:=1, 15:=1] | | | | C = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | cpuResult = X_s1v3[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuGlobalResult = H_p0s1v0i9l0[0:=4, 1:=4, 2:=4, 3:=4, 4:=4, 5:=4, 6:=4, 7:=4, 8:=4, 9:=4, 10:=4, 11:=4, 12:=4, 13:=4, 14:=4, 15:=4] | | | | gpuSharedResult = X_s1v6 | | | | r = 4 | | | | c = 4 | | | | G_A = &heap<10,0>[0] | | | | G_B = &heap<11,0>[0] | | | | G_C = &heap<12,0>[0] | | | | size_a = 16 | | | | size_b = 16 | | | | size_c = 16 | | | | start = &heap<4,0>[0] | | | | stop = &heap<4,1>[0] | | | | CPU_elapsedtime = 1 | | | | GPU_global_elapsedtime = 1 | | | | GPU_shared_elapsedtime = NULL | | | | _anon_4 = " speedup\n" | | | | _anon_5 = " -------\n" | | | | _anon_6 = "Elapsed time in CPU: %7.1f milliseconds\n" | | | | block = __struct_0__<4,4,1> | | | | grid = __struct_0__<1,1,1> | | | | _anon_7 = "Elapsed time in GPU (global memory): %7.1f milliseconds %5.1f\n" | | | | _anon_8 = "a\n" | | | | _anon_9 = "b\n" | | | | _anon_10 = NULL | | dyscope d8 (id=2, parent=d0, static=48) | | | variables | | dyscope d304 (id=3, parent=d0, static=44) | | | variables | | | | dst = &C[0] | | | | src = &heap<12,0>[0] | | | | count = 16*SIZEOF_REAL | | | | kind = 2 | | dyscope d56 (id=4, parent=d0, static=43) | | | variables | | dyscope d60 (id=5, parent=d0, static=61) | | | variables | | | | mostRecentInstance = &heap<0,2>[0] | | dyscope d59 (id=6, parent=d0, static=24) | | | variables | | | | s = &heap<2,0>[0] | | dyscope d302 (id=7, parent=d0, static=71) | | | variables | | | | this = &heap<0,2>[0] | | | | e = &heap<4,3>[0] | | dyscope d290 (id=8, parent=d0, static=47) | | | variables | | | | gridDim = __struct_0__<1,1,1> | | | | blockDim = __struct_0__<4,4,1> | | | | s = NULL | | | | A = &heap<10,0>[0] | | | | B = &heap<11,0>[0] | | | | C = &heap<12,0>[0] | | | | width = 4 | | dyscope d323 (id=9, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d322 (id=10, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d321 (id=11, parent=d0, static=55) | | | variables | | | | x = 0 | | dyscope d314 (id=12, parent=d0, static=50) | | | variables | | | | procs = X_s9v1[0:=X_s9v1[0][0:=X_s9v1[0][0][0:=p20]]] | | dyscope d313 (id=13, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<1,1,1> | | | | procFn = &(function)_block | | dyscope d320 (id=14, parent=d0, static=81) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[1][])<(__gbarrier__[1])<__gbarrier__<16,(process[16]),(boolean[16]),0>>>,(__barrier__[0][])>> | | | | _numThreads = 16 | | | | _block_barrier = &heap<13,0>[0] | | | | A_shared = X_s14v3[0:=X_s14v3[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v3[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v3[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v3[3][0:=1, 1:=1, 2:=1, 3:=1]] | | | | B_shared = X_s14v4[0:=X_s14v4[0][0:=1, 1:=1, 2:=1, 3:=1], 1:=X_s14v4[1][0:=1, 1:=1, 2:=1, 3:=1], 2:=X_s14v4[2][0:=1, 1:=1, 2:=1, 3:=1], 3:=X_s14v4[3][0:=1, 1:=1, 2:=1, 3:=1]] | | dyscope d319 (id=15, parent=d0, static=78) | | | variables | | | | blockIdx = __struct_1__<0,0,0> | | dyscope d397 (id=16, parent=d0, static=57) | | | variables | | | | z = 0 | | dyscope d396 (id=17, parent=d0, static=56) | | | variables | | | | y = 0 | | dyscope d395 (id=18, parent=d0, static=55) | | | variables | | | | x = 2 | | dyscope d325 (id=19, parent=d0, static=50) | | | variables | | | | procs = X_s16v1[0:=X_s16v1[0][0:=X_s16v1[0][0][0:=UNDEFINED], 1:=X_s16v1[0][1][0:=UNDEFINED], 2:=X_s16v1[0][2][0:=UNDEFINED], 3:=X_s16v1[0][3][0:=UNDEFINED]], 1:=X_s16v1[1][0:=X_s16v1[1][0][0:=UNDEFINED], 1:=X_s16v1[1][1][0:=UNDEFINED], 2:=X_s16v1[1][2][0:=UNDEFINED], 3:=X_s16v1[1][3][0:=UNDEFINED]], 2:=X_s16v1[2][0:=X_s16v1[2][0][0:=p21], 1:=X_s16v1[2][1][0:=p22], 2:=X_s16v1[2][2][0:=p23], 3:=X_s16v1[2][3][0:=p24]], 3:=X_s16v1[3][0:=X_s16v1[3][0][0:=p25], 1:=X_s16v1[3][1][0:=p26], 2:=X_s16v1[3][2][0:=p27], 3:=X_s16v1[3][3][0:=p28]]] | | dyscope d324 (id=20, parent=d0, static=17) | | | variables | | | | dim = __struct_0__<4,4,1> | | | | procFn = &(function)_thread | | dyscope d365 (id=21, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<2,&heap<13,0>[0]>>>> | | | | _tid = 2 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 0 | | | | row = 0 | | | | col = 2 | | | | result = 4 | | dyscope d364 (id=22, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,0,0> | | dyscope d377 (id=23, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<14,&heap<13,0>[0]>>>> | | | | _tid = 14 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 2 | | | | ty = 3 | | | | row = 3 | | | | col = 2 | | | | result = 4 | | dyscope d376 (id=24, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<2,3,0> | | dyscope d386 (id=25, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<7,&heap<13,0>[0]>>>> | | | | _tid = 7 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 1 | | | | row = 1 | | | | col = 3 | | | | result = 4 | | dyscope d385 (id=26, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,1,0> | | dyscope d390 (id=27, parent=d0, static=85) | | | variables | | | | __heap = $heap<(__struct_2__[0][])>,(_kernelInstanceNode_[0][])>,(__struct_3__[0][])>,(pointer[0][])>,(__struct_4__[0][])>,(pointer[0][])>,(pointer[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(real[0][])>,(__gbarrier__[0][])>,(__barrier__[1][])<(__barrier__[1])<__barrier__<11,&heap<13,0>[0]>>>> | | | | _tid = 11 | | | | _b = &heap<14,0>[0] | | | | bx = 0 | | | | by = 0 | | | | tx = 3 | | | | ty = 2 | | | | row = 2 | | | | col = 3 | | | | result = 4 | | dyscope d389 (id=28, parent=d0, static=82) | | | variables | | | | threadIdx = __struct_1__<3,2,0> | Process states | | process p0(id=0) | | | call stack | | | | Frame[function=_streamWait, location=72, f3:226.64-65 ";", dyscope=d60] | | | | Frame[function=cudaDeviceSynchronize, location=169, f3:435.4-15 "_streamWait", dyscope=d56] | | | | Frame[function=cudaMemcpy, location=171, f3:463.4-25 "cudaDeviceSynchronize", dyscope=d304] | | | | Frame[function=_main, location=252, f0:264.2-12 "cudaMemcpy", dyscope=d9] | | | | Frame[function=_CIVL_system, location=9, f0:303.4-9 "_main", dyscope=d0] | | process p1(id=1) | | | call stack | | process p19(id=2) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d323] | | | | Frame[function=_kernel, location=279, f0:127.8-17 "_runProcs", dyscope=d302] | | process p20(id=3) | | | call stack | | | | Frame[function=_runProcs, location=43, f3:125.4-9 "$wait", dyscope=d397] | | | | Frame[function=_block, location=291, f0:124.12-21 "_runProcs", dyscope=d320] | | process p21(id=4) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d331] | | process p22(id=5) | | | call stack | | process p23(id=6) | | | call stack | | process p24(id=7) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d343] | | process p25(id=8) | | | call stack | | process p26(id=9) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d352] | | process p27(id=10) | | | call stack | | | | Frame[function=_thread, location=326, f0:121.16-32 "C[row*width+col]", dyscope=d356] | | process p28(id=11) | | | call stack