Documenti di Didattica
Documenti di Professioni
Documenti di Cultura
In [91]: a = np.random.random(10**7).astype(np.float64)  # 10**7 samples from np.random.random, cast to float64
b = np.random.random(10**7).astype(np.float64)  # second array built by a separate call, same length and dtype; no seed is set in the visible code
263 ms ± 26.9 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
47.3 ms ± 957 µs per loop (mean ± std. dev. of 7 runs, 10 loops each)
126 ms ± 8.95 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
1
In [98]: @vectorize(["float32,float32"], target='cuda')
def cuda_VectorAdd(a, b):
return a + b
@vectorize(["float32,float32"], target='parallel')
def parallel_VectorAdd(a, b):
    """Return ``a + b``.

    The function is wrapped by ``vectorize`` with the signature string
    "float32,float32" and ``target='parallel'``.
    NOTE(review): ``vectorize`` is presumably ``numba.vectorize``; the
    import is not visible in this excerpt -- confirm.
    """
    return a + b
@vectorize(["float32,float32"], target='cpu')
def cpu_VectorAdd(a, b):
    """Return ``a + b``.

    The function is wrapped by ``vectorize`` with the signature string
    "float32,float32" and ``target='cpu'``.
    NOTE(review): ``vectorize`` is presumably ``numba.vectorize``; the
    import is not visible in this excerpt -- confirm.
    """
    return a + b
def cuda_calc1(N=32000000):
    """Add two float32 arrays of ones using ``cuda_VectorAdd``.

    Parameters
    ----------
    N : int, optional
        Number of elements in each input array. Defaults to 32000000.

    Returns
    -------
    The value returned by ``cuda_VectorAdd(A, B)``, so callers can
    inspect or validate the result instead of having it discarded.
    """
    A = np.ones(N, dtype=np.float32)
    B = np.ones(N, dtype=np.float32)
    # No output buffer is allocated up front: the call's return value is
    # used directly, which avoids an extra N-element allocation that would
    # otherwise be included in any timing of this function.
    return cuda_VectorAdd(A, B)
def par_calc1(N=32000000):
    """Add two float32 arrays of ones using ``parallel_VectorAdd``.

    Parameters
    ----------
    N : int, optional
        Number of elements in each input array. Defaults to 32000000.

    Returns
    -------
    The value returned by ``parallel_VectorAdd(A, B)``, so callers can
    inspect or validate the result instead of having it discarded.
    """
    A = np.ones(N, dtype=np.float32)
    B = np.ones(N, dtype=np.float32)
    # No output buffer is allocated up front: the call's return value is
    # used directly, which avoids an extra N-element allocation that would
    # otherwise be included in any timing of this function.
    return parallel_VectorAdd(A, B)
def cpu_calc1(N=32000000):
    """Add two float32 arrays of ones using ``cpu_VectorAdd``.

    Parameters
    ----------
    N : int, optional
        Number of elements in each input array. Defaults to 32000000.

    Returns
    -------
    The value returned by ``cpu_VectorAdd(A, B)``, so callers can
    inspect or validate the result instead of having it discarded.
    """
    A = np.ones(N, dtype=np.float32)
    B = np.ones(N, dtype=np.float32)
    # No output buffer is allocated up front: the call's return value is
    # used directly, which avoids an extra N-element allocation that would
    # otherwise be included in any timing of this function.
    return cpu_VectorAdd(A, B)
328 ms ± 16.8 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
194 ms ± 6.4 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
234 ms ± 14.3 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
1 Resultat