ai-content-maker/.venv/Lib/site-packages/numba/cuda/tests/cudapy/test_globals.py

import numpy as np
from numba import cuda, int32, float32
from numba.cuda.testing import unittest, CUDATestCase

N = 100


def simple_smem(ary):
    sm = cuda.shared.array(N, int32)
    i = cuda.grid(1)
    if i == 0:
        for j in range(N):
            sm[j] = j
    cuda.syncthreads()
    ary[i] = sm[i]


S0 = 10
S1 = 20


def coop_smem2d(ary):
    i, j = cuda.grid(2)
    sm = cuda.shared.array((S0, S1), float32)
    sm[i, j] = (i + 1) / (j + 1)
    cuda.syncthreads()
    ary[i, j] = sm[i, j]


class TestCudaTestGlobal(CUDATestCase):
    def test_global_int_const(self):
        """Test simple_smem
        """
        compiled = cuda.jit("void(int32[:])")(simple_smem)

        nelem = 100
        ary = np.empty(nelem, dtype=np.int32)
        compiled[1, nelem](ary)

        self.assertTrue(np.all(ary == np.arange(nelem, dtype=np.int32)))

    @unittest.SkipTest
    def test_global_tuple_const(self):
        """Test coop_smem2d
        """
        compiled = cuda.jit("void(float32[:,:])")(coop_smem2d)

        shape = 10, 20
        ary = np.empty(shape, dtype=np.float32)
        compiled[1, shape](ary)

        exp = np.empty_like(ary)
        for i in range(ary.shape[0]):
            for j in range(ary.shape[1]):
                exp[i, j] = float(i + 1) / (j + 1)
        self.assertTrue(np.allclose(ary, exp))


if __name__ == '__main__':
    unittest.main()
first commit 2024-05-03 04:18:51 +03:00			`import numpy as np`
			`from numba import cuda, int32, float32`
			`from numba.cuda.testing import unittest, CUDATestCase`

			`N = 100`


			`def simple_smem(ary):`
			`sm = cuda.shared.array(N, int32)`
			`i = cuda.grid(1)`
			`if i == 0:`
			`for j in range(N):`
			`sm[j] = j`
			`cuda.syncthreads()`
			`ary[i] = sm[i]`


			`S0 = 10`
			`S1 = 20`


			`def coop_smem2d(ary):`
			`i, j = cuda.grid(2)`
			`sm = cuda.shared.array((S0, S1), float32)`
			`sm[i, j] = (i + 1) / (j + 1)`
			`cuda.syncthreads()`
			`ary[i, j] = sm[i, j]`


			`class TestCudaTestGlobal(CUDATestCase):`
			`def test_global_int_const(self):`
			`"""Test simple_smem`
			`"""`
			`compiled = cuda.jit("void(int32[:])")(simple_smem)`

			`nelem = 100`
			`ary = np.empty(nelem, dtype=np.int32)`
			`compiled[1, nelem](ary)`

			`self.assertTrue(np.all(ary == np.arange(nelem, dtype=np.int32)))`

			`@unittest.SkipTest`
			`def test_global_tuple_const(self):`
			`"""Test coop_smem2d`
			`"""`
			`compiled = cuda.jit("void(float32[:,:])")(coop_smem2d)`

			`shape = 10, 20`
			`ary = np.empty(shape, dtype=np.float32)`
			`compiled[1, shape](ary)`

			`exp = np.empty_like(ary)`
			`for i in range(ary.shape[0]):`
			`for j in range(ary.shape[1]):`
			`exp[i, j] = float(i + 1) / (j + 1)`
			`self.assertTrue(np.allclose(ary, exp))`


			`if __name__ == '__main__':`
			`unittest.main()`