有没有办法优化我的列表理解以获得更好的性能？它比for循环慢

def asc_process_single(self, asc_array, asc_info, skip=1): # ncols = asc_info['ncols'] nrows = asc_info['nrows'] xllcornor = asc_info['xllcornor'] yllcornor = asc_info['yllcornor'] cellsize = asc_info['cellsize'] nodata_value = asc_info['nodata_value'] raster_size_y = cellsize*nrows # raster_size_x = cellsize*ncols # Looping over array rows and cols with skipping xyz = [] for row in range(asc_array.shape[0])[::skip]: for col in range(asc_array.shape[1])[::skip]: val_z = asc_array[row, col] # Z value of datapoint # The no data value is not processed if val_z == nodata_value: pass else: # Xcoordinate for current Z value val_x = xllcornor + (col * cellsize) # Ycoordinate for current Z value val_y = yllcornor + raster_size_y - (row * cellsize) # x, y, z to LIST xyz.append([val_x, val_y, val_z]) return xyz

def asc_process_single_listcomprehension(self, asc_array, asc_info, skip=1): # ncols = asc_info['ncols'] nrows = asc_info['nrows'] xllcornor = asc_info['xllcornor'] yllcornor = asc_info['yllcornor'] cellsize = asc_info['cellsize'] nodata_value = asc_info['nodata_value'] raster_size_y = cellsize*nrows # raster_size_x = cellsize*ncols # Looping over array rows and cols with skipping rows = range(asc_array.shape[0])[::skip] cols = range(asc_array.shape[1])[::skip] xyz = [[xllcornor + (col * cellsize), yllcornor + raster_size_y - (row * cellsize), asc_array[row, col]] for row in rows for col in cols if asc_array[row, col] != nodata_value] return xyz

xyz = [[xllcornor + (col * cellsize), yllcornor + raster_size_y - (row * cellsize), val_z] for row in rows for col in cols for val_z in [asc_array[row, col]] if val_z != nodata_value]

def asc_process_numpy_single(self, asc_array, asc_info, skip): # ncols = asc_info['ncols'] nrows = asc_info['nrows'] xllcornor = asc_info['xllcornor'] yllcornor = asc_info['yllcornor'] cellsize = asc_info['cellsize'] nodata_value = asc_info['nodata_value'] raster_size_y = cellsize*nrows # raster_size_x = cellsize*ncols rows = np.arange(0,asc_array.shape[0],skip)[:,np.newaxis] cols = np.arange(0,asc_array.shape[1],skip) x = np.zeros((len(rows),len(cols))) + xllcornor + (cols * cellsize) y = np.zeros((len(rows),len(cols))) + yllcornor + raster_size_y - (rows * cellsize) z = asc_array[::skip,::skip] xyz = np.asarray([x,y,z]).T.transpose((1,0,2)).reshape( (int(len(rows)*len(cols)), 3) ) mask = (xyz[:,2] != nodata_value) xyz = xyz[mask] return xyz

609 ms ± 44.8 ms per loop (mean ± std. dev. of 10 runs, 1 loop each) 706 ms ± 22 ms per loop (mean ± std. dev. of 10 runs, 1 loop each) 604 ms ± 21.5 ms per loop (mean ± std. dev. of 10 runs, 1 loop each) 70.4 ms ± 1.26 ms per loop (mean ± std. dev. of 10 runs, 1 loop each)

2条回答

网友

1楼 · 编辑于 2024-09-22 16:38:55

我能想象到的唯一一件让您慢下来的事情是，在原始代码中，您将asc_array[row, col]放入一个临时变量，而在列表理解中，您对它求值两次

您可能想尝试两件事：

使用walrus运算符在“if”语句中为val_z赋值，或
在另外两个for之后添加for val_z in [asc_array[row, col]]

祝你好运

网友

2楼 · 编辑于 2024-09-22 16:38:55

是的，两次评估阵列会增加计算时间。以下是我的测试用例：

def funLoop(A):
    xyz = []
    for row in range(A.shape[0]):
        for col in range(A.shape[1]):
            xyz.append([col, row, A[row, col] ])
            
def funListComp1(A):
    xyz = [ [col, row, A[row, col] ] 
           for row in range(A.shape[0]) for col in range(A.shape[1])]

def funListComp2(A):
    xyz = [ [col, A[row, col], A[row, col] ] 
           for row in range(A.shape[0]) for col in range(A.shape[1])]
    
A = np.random.rand(1000,1000)
%timeit funLoop(A)
%timeit funListComp1(A)
%timeit funListComp2(A)

457 ms ± 70.6 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
378 ms ± 8.89 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
779 ms ± 309 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)

对于大数据，对于循环，您应该始终更喜欢使用numpy而不是python。在您的情况下，numpy代码看起来有点像：

def asc_process_single_numpy(asc_array):
    nodata_value = np.nan
    raster_size_y = 1
    skip = 2
    xllcornor = 0
    yllcornor = 0
    cellsize  = 1
    rows = np.arange(0,asc_array.shape[0],skip)[:,np.newaxis]
    cols = np.arange(0,asc_array.shape[1],skip)

    #for row in rows for col in cols
    x = np.zeros((len(rows),len(cols))) + xllcornor + (cols * cellsize)
    y = np.zeros((len(rows),len(cols))) + yllcornor + raster_size_y - (rows * cellsize)
    z = asc_array[::skip,::skip]
    return np.asarray([x,y,z]).T.transpose((1,0,2)).reshape( (int(len(rows)*len(cols)), 3) )

A = np.random.rand(1000,1000)
%timeit asc_process_single(A)
%timeit asc_process_single_listcomprehension(A)
%timeit asc_process_single_numpy(A)

183 ms ± 13 ms per loop (mean ± std. dev. of 7 runs, 10 loops each)
210 ms ± 2.05 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
11.3 ms ± 222 µs per loop (mean ± std. dev. of 7 runs, 100 loops each)

相关问题更多 >

编程相关推荐

热门问题

热门文章