Professional Documents
Culture Documents
GPU - LAB - Ipynb - Colaboratory
GPU - LAB - Ipynb - Colaboratory
1 import cupy as cp
1 import numpy as np
1 n = 50
2 A = np.random.randint(0, 255, size=(n, n))
3 B = np.random.randint(0, 255, size=(n, n))
4 C = np.random.randint(0, 255, size=(n, n))
1 A_gpu = cp.random.randint(0, 255, size=(n, n))
2 B_gpu = cp.random.randint(0, 255, size=(n, n))
3 C_gpu = cp.random.randint(0, 255, size=(n, n))
1 %%timeit
2 A_dash = np.dot(A, A+B) + C
112 µs ± 22.1 µs per loop (mean ± std. dev. of 7 runs, 10000 loops each)
1 %%timeit
2 A_dash_gpu = cp.dot(A_gpu, A_gpu + B_gpu) + C_gpu
(no timing output was captured for this cell in the export)
1 n = 500
2 A = np.random.randint(0, 255, size=(n, n))
3 B = np.random.randint(0, 255, size=(n, n))
4 C = np.random.randint(0, 255, size=(n, n))
1 A_gpu = cp.random.randint(0, 255, size=(n, n))
2 B_gpu = cp.random.randint(0, 255, size=(n, n))
3 C_gpu = cp.random.randint(0, 255, size=(n, n))
1 %%timeit
2 A_dash = np.dot(A, A+B) + C
167 ms ± 25.8 ms per loop (mean ± std. dev. of 7 runs, 10 loops each)
1 %%timeit
2 A_dash_gpu = cp.dot(A_gpu, A_gpu + B_gpu) + C_gpu
479 µs ± 461 ns per loop (mean ± std. dev. of 7 runs, 1000 loops each)
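1 n = 2000
2 A = np.random.randint(0, 255, size=(n, n))
3 B = np.random.randint(0, 255, size=(n, n))
4 C = np.random.randint(0, 255, size=(n, n))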
1 of 2 4/17/23, 3:39 PM
GPU_LAB.ipynb - Colaboratory https://colab.research.google.com/drive/1222GuvwsBst...
1 A_gpu = cp.random.randint(0, 255, size=(n, n))
2 B_gpu = cp.random.randint(0, 255, size=(n, n))
3 C_gpu = cp.random.randint(0, 255, size=(n, n))
1 %%timeit
2 A_dash = np.dot(A, A+B) + C
12.9 s ± 640 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
1 %%timeit
2 A_dash_gpu = cp.dot(A_gpu, A_gpu + B_gpu) + C_gpu
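14.7 ms ± 322 µs per loop (mean ± std. dev. of 7 runs, 1000 loops each)
Note: CuPy launches GPU work asynchronously with respect to the CPU, so GPU timings taken with %%timeit and no device synchronization (e.g. cp.cuda.Stream.null.synchronize() at the end of the cell, or cupyx.profiler.benchmark) may under-report the real GPU time; treat the GPU figures in this notebook as lower bounds.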
2 of 2 4/17/23, 3:39 PM