spcl
diff --git a/‎.gitignore‎
Lines changed: 1 addition & 0 deletions b/‎.gitignore‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎README.md‎
Lines changed: 26 additions & 6 deletions b/‎README.md‎
Lines changed: 26 additions & 6 deletions
diff --git a/‎bench_info/covariance2.json‎
Lines changed: 26 additions & 0 deletions b/‎bench_info/covariance2.json‎
Lines changed: 26 additions & 0 deletions
diff --git a/‎environment.yml‎
Lines changed: 17 additions & 0 deletions b/‎environment.yml‎
Lines changed: 17 additions & 0 deletions
diff --git a/‎framework_info/dpnp_cpu.json‎
Lines changed: 10 additions & 0 deletions b/‎framework_info/dpnp_cpu.json‎
Lines changed: 10 additions & 0 deletions
diff --git a/‎framework_info/dpnp_gpu.json‎
Lines changed: 11 additions & 0 deletions b/‎framework_info/dpnp_gpu.json‎
Lines changed: 11 additions & 0 deletions
diff --git a/‎npbench/benchmarks/cavity_flow/cavity_flow_dpnp.py‎
Lines changed: 74 additions & 0 deletions b/‎npbench/benchmarks/cavity_flow/cavity_flow_dpnp.py‎
Lines changed: 74 additions & 0 deletions
diff --git a/‎npbench/benchmarks/channel_flow/channel_flow_dpnp.py‎
Lines changed: 142 additions & 0 deletions b/‎npbench/benchmarks/channel_flow/channel_flow_dpnp.py‎
Lines changed: 142 additions & 0 deletions
diff --git a/‎npbench/benchmarks/contour_integral/contour_integral_dpnp.py‎
Lines changed: 26 additions & 0 deletions b/‎npbench/benchmarks/contour_integral/contour_integral_dpnp.py‎
Lines changed: 26 additions & 0 deletions
@@ -130,3 +130,4 @@ dmypy.json
 
 # dace
 .dacecache/
+*.csv
@@ -4,13 +4,16 @@
 ## Quickstart
 
 To install NPBench, simply execute:
+
 ```
 python -m pip install -r requirements.txt
 python -m pip install .
 ```
+
 You can then run a subset of the benchmarks with NumPy, Numba, and DaCe and plot
 the speedup of DaCe and Numba against NumPy:
-```
+
+``` bash
 python -m pip install numba
 python -m pip install dace
 python quickstart.py
@@ -22,6 +25,7 @@ python plot_results.py
 Currently, the following frameworks are supported (in alphabetical order):
 - CuPy
 - DaCe
+- Dpnp
 - JAX
 - Numba
 - NumPy
@@ -56,6 +60,27 @@ However, you may want to install the latest version from the [GitHub repository]
 To run NPBench with DaCe, you have to select as framework (see details below)
 either `dace_cpu` or `dace_gpu`.
 
+### DPNP
+
+With `dpnp`, it is strongly recommended to use `conda` instead of `pip`, because `dpnp` depends on Intel packages.
+Refer to the
+[dpnp quick start guide](https://intelpython.github.io/dpnp/quick_start_guide.html#building-for-custom-sycl-targets) to learn more
+about building for custom SYCL targets or installing the `dpnp` package from the `intel` channel.
+
+Unlike with pip, with conda it is advisable to install all packages at once.
+Edit `environment.yml` to include any additional packages and optional dependencies (e.g. hardware-dependent frameworks
+or utilities such as `ipython`). Then run:
+
+``` bash
+$ conda env create -f environment.yml    # environment.yml contains all the right dependencies
+$ conda activate npb              # Activate the environment
+$ python -m pip install pygount          # Only dependency not distributed with conda
+```
+
+To run NPBench with dpnp, you must select either `dpnp_cpu` or `dpnp_gpu` as the framework, depending on your hardware (see details below).
+
+_The DPNP port covers only a subset of the benchmarks, selected based on interest and on a best-effort basis._
+
 ### Jax
 
 JAX can be installed with pip:
@@ -73,7 +98,6 @@ JAX can be installed with pip:
   ```
 For more installation options, please consult the JAX [installation guide](https://jax.readthedocs.io/en/latest/installation.html#installation).
 
-
 ### Numba
 
 Numba can be installed with pip:
@@ -172,7 +196,3 @@ NPBench is a collection of scientific Python/NumPy codes from various domains th
 - Pythran [benchmarks](https://github.com/serge-sans-paille/numpy-benchmarks/)
 - [Stockham-FFT](http://urn.kb.se/resolve?urn=urn:nbn:se:kth:diva-287731)
 - Weather stencils from [gt4py](https://github.com/GridTools/gt4py)
-
-
-
-
 
@@ -0,0 +1,26 @@
+{
+    "benchmark": {
+        "name": "Covariance2",
+        "short_name": "covarian2",
+        "relative_path": "polybench/covariance2",
+        "module_name": "covariance2",
+        "func_name": "kernel",
+        "kind": "microbench",
+        "domain": "Learning",
+        "dwarf": "dense_linear_algebra",
+        "parameters": {
+            "S": { "M": 500, "N": 600 },
+            "M": { "M": 1400, "N": 1800 },
+            "L": { "M": 3200, "N": 4000 },
+            "paper": { "M": 1200, "N": 1400 }
+        },
+        "init": {
+            "func_name": "initialize",
+            "input_args": ["M", "N"],
+            "output_args": ["float_n", "data"]
+        },
+        "input_args": ["M", "float_n", "data"],
+        "array_args": ["data"],
+        "output_args": []
+    }
+}
@@ -0,0 +1,17 @@
+name: npb
+channels:
+  - conda-forge
+  - https://software.repos.intel.com/python/conda
+dependencies:
+  - python=3.10.14
+  - numpy=1.26.4    # dpnp nominally requires numpy<=1.24.4, while numba-dpex requires numpy>=1.26.4; 1.26.4 appears to work fine with dpnp as well
+  - matplotlib
+  - pandas
+  - scipy
+  - dpnp
+  - dace
+  - numba
+  - pythran
+  - cupy
+  # pygount has to be installed via pip
+
@@ -0,0 +1,10 @@
+{
+    "framework": {
+        "simple_name": "dpnp_cpu",
+        "full_name": "Dpnp_CPU",
+        "prefix": "dpc",
+        "postfix": "dpnp_cpu",
+        "class": "DpnpFramework",
+        "arch": "cpu"
+    }
+}
@@ -0,0 +1,11 @@
+{
+    "framework": {
+        "simple_name": "dpnp_gpu",
+        "full_name": "Dpnp_GPU",
+        "prefix": "dpg",
+        "postfix": "dpnp_gpu",
+        "class": "DpnpFramework",
+        "arch": "gpu"
+    }
+}
+
@@ -0,0 +1,74 @@
+import dpnp as np
+
+def build_up_b(b, rho, dt, u, v, dx, dy):
+    # Fill the interior of `b` in place from central differences of the
+    # velocity components `u` and `v`. The outermost rows and columns of `b`
+    # are not written, and nothing is returned.
+    # Differences along axis 1 are scaled by 2*dx and differences along
+    # axis 0 by 2*dy, i.e. axis 1 is x and axis 0 is y.
+    # cavity_flow hands the filled `b` to pressure_poisson.
+    b[1:-1, 1:-1] = (
+        rho * (
+            (1 / dt * ((u[1:-1, 2:] - u[1:-1, 0:-2]) / (2 * dx) +
+                        (v[2:, 1:-1] - v[0:-2, 1:-1]) / (2 * dy))) -
+            ((u[1:-1, 2:] - u[1:-1, 0:-2]) / (2 * dx))**2 -
+            2 * ((u[2:, 1:-1] - u[0:-2, 1:-1]) / (2 * dy) *
+                 (v[1:-1, 2:] - v[1:-1, 0:-2]) / (2 * dx)) -
+            ((v[2:, 1:-1] - v[0:-2, 1:-1]) / (2 * dy))**2
+        )
+    )
+
+def pressure_poisson(nit, p, dx, dy, b):
+    pn = np.empty_like(p)
+    for q in range(nit):
+        pn[:] = p.copy()
+        p[1:-1, 1:-1] = (
+            ((pn[1:-1, 2:] + pn[1:-1, 0:-2]) * dy**2 +
+             (pn[2:, 1:-1] + pn[0:-2, 1:-1]) * dx**2) /
+            (2 * (dx**2 + dy**2)) - dx**2 * dy**2 /
+            (2 * (dx**2 + dy**2)) * b[1:-1, 1:-1]
+        )
+
+        p[:, -1] = p[:, -2]  # dp/dx = 0 at x = 2
+        p[0, :] = p[1, :]  # dp/dy = 0 at y = 0
+        p[:, 0] = p[:, 1]  # dp/dx = 0 at x = 0
+        p[-1, :] = 0  # p = 0 at y = 2
+
+def cavity_flow(nx, ny, nt, nit, u, v, dt, dx, dy, p, rho, nu):
+    un = np.empty_like(u)
+    vn = np.empty_like(v)
+    b = np.zeros((ny, nx))
+
+    for n in range(nt):
+        un[:] = u.copy()
+        vn[:] = v.copy()
+
+        build_up_b(b, rho, dt, u, v, dx, dy)
+        pressure_poisson(nit, p, dx, dy, b)
+
+        u[1:-1, 1:-1] = (
+            un[1:-1, 1:-1] - un[1:-1, 1:-1] * dt / dx *
+            (un[1:-1, 1:-1] - un[1:-1, 0:-2]) -
+            vn[1:-1, 1:-1] * dt / dy *
+            (un[1:-1, 1:-1] - un[0:-2, 1:-1]) - dt / (2 * rho * dx) *
+            (p[1:-1, 2:] - p[1:-1, 0:-2]) + nu *
+            (dt / dx**2 *
+             (un[1:-1, 2:] - 2 * un[1:-1, 1:-1] + un[1:-1, 0:-2]) +
+             dt / dy**2 *
+             (un[2:, 1:-1] - 2 * un[1:-1, 1:-1] + un[0:-2, 1:-1]))
+        )
+
+        v[1:-1, 1:-1] = (
+            vn[1:-1, 1:-1] - un[1:-1, 1:-1] * dt / dx *
+            (vn[1:-1, 1:-1] - vn[1:-1, 0:-2]) -
+            vn[1:-1, 1:-1] * dt / dy *
+            (vn[1:-1, 1:-1] - vn[0:-2, 1:-1]) - dt / (2 * rho * dy) *
+            (p[2:, 1:-1] - p[0:-2, 1:-1]) + nu *
+            (dt / dx**2 *
+             (vn[1:-1, 2:] - 2 * vn[1:-1, 1:-1] + vn[1:-1, 0:-2]) +
+             dt / dy**2 *
+             (vn[2:, 1:-1] - 2 * vn[1:-1, 1:-1] + vn[0:-2, 1:-1]))
+        )
+
+        u[0, :] = 0
+        u[:, 0] = 0
+        u[:, -1] = 0
+        u[-1, :] = 1  # set velocity on cavity lid equal to 1
+        v[0, :] = 0
+        v[-1, :] = 0
+        v[:, 0] = 0
+        v[:, -1] = 0
@@ -0,0 +1,142 @@
+import dpnp as np
+
+def build_up_b(rho, dt, dx, dy, u, v):
+    # Build and return a new array `b` (same shape and dtype as `u`) from
+    # central differences of the velocity components `u` and `v`.
+    # Rows 0 and -1 are never written and therefore stay zero.
+    # Axis 1 is x (spacing dx, periodic) and axis 0 is y (spacing dy).
+    b = np.zeros_like(u)
+    # Interior columns: ordinary left/right neighbours.
+    b[1:-1,
+      1:-1] = (rho * (1 / dt * ((u[1:-1, 2:] - u[1:-1, 0:-2]) / (2 * dx) +
+                                (v[2:, 1:-1] - v[0:-2, 1:-1]) / (2 * dy)) -
+                      ((u[1:-1, 2:] - u[1:-1, 0:-2]) / (2 * dx))**2 - 2 *
+                      ((u[2:, 1:-1] - u[0:-2, 1:-1]) / (2 * dy) *
+                       (v[1:-1, 2:] - v[1:-1, 0:-2]) / (2 * dx)) -
+                      ((v[2:, 1:-1] - v[0:-2, 1:-1]) / (2 * dy))**2))
+
+    # Periodic BC Pressure @ x = 2
+    # (last column: column 0 stands in for the missing right neighbour)
+    b[1:-1, -1] = (rho * (1 / dt * ((u[1:-1, 0] - u[1:-1, -2]) / (2 * dx) +
+                                    (v[2:, -1] - v[0:-2, -1]) / (2 * dy)) -
+                          ((u[1:-1, 0] - u[1:-1, -2]) / (2 * dx))**2 - 2 *
+                          ((u[2:, -1] - u[0:-2, -1]) / (2 * dy) *
+                           (v[1:-1, 0] - v[1:-1, -2]) / (2 * dx)) -
+                          ((v[2:, -1] - v[0:-2, -1]) / (2 * dy))**2))
+
+    # Periodic BC Pressure @ x = 0
+    # (first column: column -1 stands in for the missing left neighbour)
+    b[1:-1, 0] = (rho * (1 / dt * ((u[1:-1, 1] - u[1:-1, -1]) / (2 * dx) +
+                                   (v[2:, 0] - v[0:-2, 0]) / (2 * dy)) -
+                         ((u[1:-1, 1] - u[1:-1, -1]) / (2 * dx))**2 - 2 *
+                         ((u[2:, 0] - u[0:-2, 0]) / (2 * dy) *
+                          (v[1:-1, 1] - v[1:-1, -1]) /
+                          (2 * dx)) - ((v[2:, 0] - v[0:-2, 0]) / (2 * dy))**2))
+
+    return b
+
+
+def pressure_poisson_periodic(nit, p, dx, dy, b):
+    pn = np.empty_like(p)
+
+    for q in range(nit):
+        pn = p.copy()
+        p[1:-1, 1:-1] = (((pn[1:-1, 2:] + pn[1:-1, 0:-2]) * dy**2 +
+                          (pn[2:, 1:-1] + pn[0:-2, 1:-1]) * dx**2) /
+                         (2 * (dx**2 + dy**2)) - dx**2 * dy**2 /
+                         (2 * (dx**2 + dy**2)) * b[1:-1, 1:-1])
+
+        # Periodic BC Pressure @ x = 2
+        p[1:-1, -1] = (((pn[1:-1, 0] + pn[1:-1, -2]) * dy**2 +
+                        (pn[2:, -1] + pn[0:-2, -1]) * dx**2) /
+                       (2 * (dx**2 + dy**2)) - dx**2 * dy**2 /
+                       (2 * (dx**2 + dy**2)) * b[1:-1, -1])
+
+        # Periodic BC Pressure @ x = 0
+        p[1:-1,
+          0] = (((pn[1:-1, 1] + pn[1:-1, -1]) * dy**2 +
+                 (pn[2:, 0] + pn[0:-2, 0]) * dx**2) / (2 * (dx**2 + dy**2)) -
+                dx**2 * dy**2 / (2 * (dx**2 + dy**2)) * b[1:-1, 0])
+
+        # Wall boundary conditions, pressure
+        p[-1, :] = p[-2, :]  # dp/dy = 0 at y = 2
+        p[0, :] = p[1, :]  # dp/dy = 0 at y = 0
+
+
+def channel_flow(nit, u, v, dt, dx, dy, p, rho, nu, F):
+    # Step the velocity components `u`, `v` and the pressure `p` in place
+    # until the relative change of sum(u) between two consecutive steps
+    # is no longer above 0.001. Returns the number of steps taken.
+    # Axis 1 (x) is periodic; rows 0 and -1 (y walls) are forced to zero.
+    # `F * dt` is added to the `u` updates only.
+    udiff = 1  # start above the threshold so the loop runs at least once
+    stepcount = 0
+
+    # NOTE(review): udiff is signed, so a step in which sum(u) decreases
+    # also ends the loop - confirm this is intended.
+    while udiff > .001:
+        # Snapshots of the previous step; every update below reads these.
+        un = u.copy()
+        vn = v.copy()
+
+        b = build_up_b(rho, dt, dx, dy, u, v)
+        pressure_poisson_periodic(nit, p, dx, dy, b)
+
+        # Interior update of u (rows 1:-1, columns 1:-1).
+        u[1:-1,
+          1:-1] = (un[1:-1, 1:-1] - un[1:-1, 1:-1] * dt / dx *
+                   (un[1:-1, 1:-1] - un[1:-1, 0:-2]) -
+                   vn[1:-1, 1:-1] * dt / dy *
+                   (un[1:-1, 1:-1] - un[0:-2, 1:-1]) - dt / (2 * rho * dx) *
+                   (p[1:-1, 2:] - p[1:-1, 0:-2]) + nu *
+                   (dt / dx**2 *
+                    (un[1:-1, 2:] - 2 * un[1:-1, 1:-1] + un[1:-1, 0:-2]) +
+                    dt / dy**2 *
+                    (un[2:, 1:-1] - 2 * un[1:-1, 1:-1] + un[0:-2, 1:-1])) +
+                   F * dt)
+
+        # Interior update of v (same stencil, pressure gradient along y).
+        v[1:-1,
+          1:-1] = (vn[1:-1, 1:-1] - un[1:-1, 1:-1] * dt / dx *
+                   (vn[1:-1, 1:-1] - vn[1:-1, 0:-2]) -
+                   vn[1:-1, 1:-1] * dt / dy *
+                   (vn[1:-1, 1:-1] - vn[0:-2, 1:-1]) - dt / (2 * rho * dy) *
+                   (p[2:, 1:-1] - p[0:-2, 1:-1]) + nu *
+                   (dt / dx**2 *
+                    (vn[1:-1, 2:] - 2 * vn[1:-1, 1:-1] + vn[1:-1, 0:-2]) +
+                    dt / dy**2 *
+                    (vn[2:, 1:-1] - 2 * vn[1:-1, 1:-1] + vn[0:-2, 1:-1])))
+
+        # Periodic BC u @ x = 2
+        u[1:-1, -1] = (
+            un[1:-1, -1] - un[1:-1, -1] * dt / dx *
+            (un[1:-1, -1] - un[1:-1, -2]) - vn[1:-1, -1] * dt / dy *
+            (un[1:-1, -1] - un[0:-2, -1]) - dt / (2 * rho * dx) *
+            (p[1:-1, 0] - p[1:-1, -2]) + nu *
+            (dt / dx**2 *
+             (un[1:-1, 0] - 2 * un[1:-1, -1] + un[1:-1, -2]) + dt / dy**2 *
+             (un[2:, -1] - 2 * un[1:-1, -1] + un[0:-2, -1])) + F * dt)
+
+        # Periodic BC u @ x = 0
+        u[1:-1,
+          0] = (un[1:-1, 0] - un[1:-1, 0] * dt / dx *
+                (un[1:-1, 0] - un[1:-1, -1]) - vn[1:-1, 0] * dt / dy *
+                (un[1:-1, 0] - un[0:-2, 0]) - dt / (2 * rho * dx) *
+                (p[1:-1, 1] - p[1:-1, -1]) + nu *
+                (dt / dx**2 *
+                 (un[1:-1, 1] - 2 * un[1:-1, 0] + un[1:-1, -1]) + dt / dy**2 *
+                 (un[2:, 0] - 2 * un[1:-1, 0] + un[0:-2, 0])) + F * dt)
+
+        # Periodic BC v @ x = 2
+        v[1:-1, -1] = (
+            vn[1:-1, -1] - un[1:-1, -1] * dt / dx *
+            (vn[1:-1, -1] - vn[1:-1, -2]) - vn[1:-1, -1] * dt / dy *
+            (vn[1:-1, -1] - vn[0:-2, -1]) - dt / (2 * rho * dy) *
+            (p[2:, -1] - p[0:-2, -1]) + nu *
+            (dt / dx**2 *
+             (vn[1:-1, 0] - 2 * vn[1:-1, -1] + vn[1:-1, -2]) + dt / dy**2 *
+             (vn[2:, -1] - 2 * vn[1:-1, -1] + vn[0:-2, -1])))
+
+        # Periodic BC v @ x = 0
+        v[1:-1,
+          0] = (vn[1:-1, 0] - un[1:-1, 0] * dt / dx *
+                (vn[1:-1, 0] - vn[1:-1, -1]) - vn[1:-1, 0] * dt / dy *
+                (vn[1:-1, 0] - vn[0:-2, 0]) - dt / (2 * rho * dy) *
+                (p[2:, 0] - p[0:-2, 0]) + nu *
+                (dt / dx**2 *
+                 (vn[1:-1, 1] - 2 * vn[1:-1, 0] + vn[1:-1, -1]) + dt / dy**2 *
+                 (vn[2:, 0] - 2 * vn[1:-1, 0] + vn[0:-2, 0])))
+
+        # Wall BC: u,v = 0 @ y = 0,2
+        u[0, :] = 0
+        u[-1, :] = 0
+        v[0, :] = 0
+        v[-1, :] = 0
+
+        # Relative change of the total of u against the previous step.
+        udiff = (np.sum(u) - np.sum(un)) / np.sum(u)
+        stepcount += 1
+
+    return stepcount
@@ -0,0 +1,26 @@
+import dpnp as np
+
+def contour_integral(NR, NM, slab_per_bc, Ham, int_pts, Y):
+    P0 = np.zeros((NR, NM), dtype=np.complex128)
+    P1 = np.zeros((NR, NM), dtype=np.complex128)
+    
+    for z in int_pts:
+        Tz = np.zeros((NR, NR), dtype=np.complex128)
+        
+        for n in range(slab_per_bc + 1):
+            zz = np.power(z, slab_per_bc / 2 - n)
+            Tz += zz * Ham[n]
+        
+        if NR == NM:
+            X = np.linalg.inv(Tz)
+        else:
+            X = np.linalg.solve(Tz, Y)
+        
+        if abs(z) < 1.0:
+            X = -X
+        
+        P0 += X
+        P1 += z * X
+
+    return P0, P1
+
Original file line number	Diff line number	Diff line change
`@@ -130,3 +130,4 @@ dmypy.json`
`130`	`130`
`131`	`131`	`# dace`
`132`	`132`	`.dacecache/`
	`133`	`+*.csv`