Python中的并行CPU求和

import concurrent.futures
import random
import threading
import time
from concurrent.futures import ThreadPoolExecutor
from functools import partial

import numpy as np

# parameters
dWhy = np.random.sample(300)
dby = np.random.sample(300)

# Func is called from pool workers and mutates the shared accumulators in
# place; the lock keeps each pair of updates from interleaving with another
# worker's updates.
_ACCUM_LOCK = threading.Lock()


def Func(ps, targets, hs, t):
    """Add the contribution of step ``t`` to the global accumulators.

    Args:
        ps: Indexable sequence of per-step values; ``ps[t]`` is added to
            every entry of ``dby``.
        targets: Unused; kept so existing callers keep working.
        hs: Indexable sequence of per-step values; ``ps[t] * hs[t]`` is
            added to every entry of ``dWhy``.
        t: Index of the step to accumulate.

    Returns:
        The global ``(dWhy, dby)`` arrays themselves (not copies), after the
        in-place update.
    """
    global dWhy, dby
    dy = np.copy(ps[t])
    # Compute the contribution outside the lock; only the shared in-place
    # updates need to be serialised.
    contribution = np.dot(dy, hs[t].T)
    with _ACCUM_LOCK:
        dWhy += contribution
        dby += dy
    return dWhy, dby


if __name__ == '__main__':
    n_steps = 100000
    ps = np.random.sample(n_steps)
    targets = np.random.sample(n_steps)
    hs = np.random.sample(n_steps)

    # Baseline: accumulate every step serially on the main thread.
    # perf_counter is monotonic, so the difference is a reliable duration.
    start = time.perf_counter()
    for t in range(n_steps):
        dy = np.copy(ps[t])
        dWhy += np.dot(dy, hs[t].T)
        dby += dy
    finish = time.perf_counter()
    print("One thread: ")
    print(finish - start)

    # Start the second measurement from fresh accumulators.
    dWhy = np.random.sample(300)
    dby = np.random.sample(300)

    # NOTE(review): each task is a tiny amount of CPU-bound work, so pool
    # overhead is expected to dominate this measurement.
    start = time.perf_counter()
    with concurrent.futures.ThreadPoolExecutor() as executor:
        # A named callable with the fixed arguments pre-bound replaces the
        # lambda/tuple-unpacking wrapper.
        accumulate_step = partial(Func, ps, targets, hs)
        for out1, out2 in executor.map(accumulate_step, range(n_steps)):
            dWhy, dby = out1, out2
    finish = time.perf_counter()
    print("Multithreads time: ")
    print(finish - start)

2条回答

网友

1楼 · 编辑于 2024-07-01 08:24:02

考虑用广播代替：

import numpy as np

# Accumulators first, then the per-step inputs; each array is filled with
# uniform random samples. The generators are consumed left to right, so the
# arrays are drawn in the order dWhy, dby, ps, targets, hs.
dWhy, dby = (np.random.sample(300) for _ in range(2))
ps, targets, hs = (np.random.sample(100000) for _ in range(3))

# Summing ps[t] * hs[t] over every t is the inner product of ps and hs, and
# summing ps[t] is ps.sum(); each scalar total is then added to every entry
# of its accumulator in a single in-place operation.
total_why = ps.dot(hs)
total_by = ps.sum()
dWhy += total_why
dby += total_by

将上面的计算重复运行 20000 次时的耗时：

import time

# Time 20000 repetitions of the vectorised update, then report the total and
# the average per repetition from the same measurement.
timer = time.perf_counter()
for _ in range(20000):
    dWhy += np.dot(ps, hs)
    dby += np.sum(ps)
elapsed = time.perf_counter() - timer
print(elapsed)
# >> 3.2034592628479004
print(elapsed / 20000)
# >> 0.00016017296314239503

网友

2楼 · 编辑于 2024-07-01 08:24:02

将 lambda 转换为命名函数。

相关问题更多 >

编程相关推荐

热门问题

热门文章