用“进程”或“线程”策略将独立块填充到全局数组中？

from multiprocessing.dummy import Pool as ThreadPool ## discretization along x-axis and y-axis for each block arrayCross_k = np.linspace(kMIN, kMAX, dimPoints) arrayCross_mu = np.linspace(-1, 1, dimPoints) # Build all big matrix with N total blocks = dimBlock*dimBlock = 16 here arrayFullCross = np.zeros((dimBlocks, dimBlocks, arrayCross_k.size, arrayCross_mu.size)) dimBlocks = 4 # Size of dimension along k and mu axis dimPoints = 100 # dimension along one dimension of global arrayFullCross dimMatCovCross = dimBlocks*dimPoints # Build cross-correlation matrix def buildCrossMatrix_loop(params_array): # rows indices xb = params_array[0] # columns indices yb = params_array[1] # Current redshift z = zrange[params_array[2]] # Loop inside block for ub in range(dimPoints): for vb in range(dimPoints): # Diagonal blocs if (xb == yb): # Fill the (xb,yb) su-block of global array by arrayFullCross[xb][xb][ub][vb] = 2*P_obs_cross(arrayCross_k[ub], arrayCross_mu[vb] , z, 10**P_m(np.log10(arrayCross_k[ub])), ... ... # End of function buildCrossMatrix_loop # Main loop while i < len(zrange): def generatorCrossMatrix(index): for igen in range(dimBlocks): for lgen in range(dimBlocks): yield igen, lgen, index if __name__ == '__main__': # Use 20 threads pool = ThreadPool(20) pool.map(buildCrossMatrix_loop, generatorCrossMatrix(i)) # Increment index "i" i = i+1

from multiprocessing import Process # Main loop on z range while i < len(zrange): params_p = [] for ip in range(4): for jp in range(4): params_p.append(ip) params_p.append(jp) params_p.append(i) p = Process(target=buildCrossMatrix_loop, args=(params_p,)) params_p = [] p.start() # Finished : wait everybody p.join() ... ... i = i+1 # End of main while loop

# Build cross-correlation matrix def buildCrossMatrix_loop(params_array): # rows indices xb = params_array[0] # columns indices yb = params_array[1] # Current redshift z = zrange[params_array[2]] # Loop inside block for ub in range(dimPoints): for vb in range(dimPoints): # Diagonal blocs if (xb == yb): arrayFullCross[xb][xb][ub][vb] = 2*P_obs_cross(arrayCross_k[ub], arrayCross_mu[vb]) ... ... #others assignments on arrayFullCross elements # Return global array to main process return arrayFullCross

# NOTE(review): this snippet was collapsed onto one line; the line breaks and
# indentation below are reconstructed from the syntax - confirm the nesting.
if __name__ == '__main__':
    pool = Pool(16)
    # pool.map returns a list with one entry per tuple yielded by the generator
    outputArray = pool.map(buildCrossMatrix_loop, generatorCrossMatrix(i))
    pool.terminate()
    ## Print outputArray
    # Python 2 print statement
    print 'outputArray = ', outputArray
    ## Reshape 4D outputArray to 2D array
    # NOTE(review): if every call returns a full 4-D array, np.array(outputArray)
    # would have an extra leading axis - confirm the reshape target.
    arrayFullCross2D_swap = np.array(outputArray).swapaxes(1,2).reshape(dimMatCovCross,dimMatCovCross)

1条回答

网友
1楼 · 发布于 2024-09-27 18:09:14

首先，我认为 multiprocessing.ThreadPool 是一个私有 API，所以应该避免使用它。其次，multiprocessing.dummy 是一个无用的模块：它不做任何多线程/多进程处理，这就是你看不到任何性能提升的原因。你应该使用“普通的” multiprocessing 模块。
第二个代码不起作用，因为它使用多个进程。进程不共享内存，因此在子进程中所做的更改不会反映在其他子进程或主进程中。您可以：
返回值并在主进程中将它们组合在一起，例如使用multiprocessing.Pool.map
使用 threading 而不是 multiprocessing：只需把 `import multiprocessing` 替换为 `import threading`，把 `multiprocessing.Process` 替换为 `threading.Thread`，代码就应该可以工作。
请注意，threading 版本之所以可行，只是因为 numpy 在计算期间会释放 GIL；否则它会被限制在单个 CPU 上运行。
你可能还想看看我几分钟前回答过的这个类似问题。

相关问题更多 >

编程相关推荐

热门问题

热门文章