import pyshader as ps import kp import numpy as np def test_array_multiplication(): # 1. Create Kompute Manager (selects device 0 by default) mgr = kp.Manager() # 2. Create Kompute Tensors to hold data tensor_in_a = kp.Tensor([2, 2, 2]) tensor_in_b = kp.Tensor([1, 2, 3]) tensor_out = kp.Tensor([0, 0, 0]) # 3. Initialise the Kompute Tensors in the GPU mgr.eval_tensor_create_def([tensor_in_a, tensor_in_b, tensor_out]) # 4. Define the multiplication shader code to run on the GPU @ps.python2shader def compute_shader_multiply(index=("input", "GlobalInvocationId", ps.ivec3), data1=("buffer", 0, ps.Array(ps.f32)), data2=("buffer", 1, ps.Array(ps.f32)), data3=("buffer", 2, ps.Array(ps.f32))): i = index.x data3[i] = data1[i] * data2[i] # 5. Run shader code against our previously defined tensors mgr.eval_algo_data_def( [tensor_in_a, tensor_in_b, tensor_out], compute_shader_multiply.to_spirv()) # 6. Sync tensor data from GPU back to local mgr.eval_tensor_sync_local_def([tensor_out]) assert tensor_out.data() == [2.0, 4.0, 6.0] assert np.all(tensor_out.numpy() == [2.0, 4.0, 6.0])