From 37a62bb7069d2cfaabd570bcc4373039fb9af9f6 Mon Sep 17 00:00:00 2001
From: Claus Susanne <sclaus@Clauss-MacBook-Pro.local>
Date: Wed, 19 Feb 2025 14:25:18 +0100
Subject: [PATCH 01/10] add void* to tabulate_tensor

---
 ffcx/codegeneration/C/expressions_template.py |  3 ++-
 ffcx/codegeneration/C/integrals_template.py   |  3 ++-
 ffcx/codegeneration/ufcx.h                    | 15 +++++++++++----
 ffcx/codegeneration/utils.py                  |  1 +
 test/test_add_mode.py                         |  3 +++
 test/test_jit_expression.py                   |  7 +++++++
 test/test_jit_forms.py                        | 17 +++++++++++++++++
 test/test_submesh.py                          |  1 +
 test/test_tensor_product.py                   |  2 ++
 9 files changed, 46 insertions(+), 6 deletions(-)

diff --git a/ffcx/codegeneration/C/expressions_template.py b/ffcx/codegeneration/C/expressions_template.py
index 079025d9a..dc0a0574b 100644
--- a/ffcx/codegeneration/C/expressions_template.py
+++ b/ffcx/codegeneration/C/expressions_template.py
@@ -23,7 +23,8 @@
                                     const {scalar_type}* restrict c,
                                     const {geom_type}* restrict coordinate_dofs,
                                     const int* restrict entity_local_index,
-                                    const uint8_t* restrict quadrature_permutation)
+                                    const uint8_t* restrict quadrature_permutation,
+                                    void* user_data)
 {{
 {tabulate_expression}
 }}
diff --git a/ffcx/codegeneration/C/integrals_template.py b/ffcx/codegeneration/C/integrals_template.py
index 2bb1568ec..407ed7a96 100644
--- a/ffcx/codegeneration/C/integrals_template.py
+++ b/ffcx/codegeneration/C/integrals_template.py
@@ -16,7 +16,8 @@
                                     const {scalar_type}* restrict c,
                                     const {geom_type}* restrict coordinate_dofs,
                                     const int* restrict entity_local_index,
-                                    const uint8_t* restrict quadrature_permutation)
+                                    const uint8_t* restrict quadrature_permutation,
+                                    void* user_data)
 {{
 {tabulate_tensor}
 }}
diff --git a/ffcx/codegeneration/ufcx.h b/ffcx/codegeneration/ufcx.h
index 73352ef61..b768bb8cd 100644
--- a/ffcx/codegeneration/ufcx.h
+++ b/ffcx/codegeneration/ufcx.h
@@ -86,11 +86,15 @@ extern "C"
   /// For integrals not on interior facets, this argument has no effect and a
   /// null pointer can be passed. For interior facets the array will have size 2
   /// (one permutation for each cell adjacent to the facet).
+  /// @param[in] user_data Custom user data passed to the tabulate function. 
+  /// For example, a struct with additional data needed for the tabulate function.
+  /// See the implementation of runtime integrals for further details.
   typedef void(ufcx_tabulate_tensor_float32)(
       float* restrict A, const float* restrict w, const float* restrict c,
       const float* restrict coordinate_dofs,
       const int* restrict entity_local_index,
-      const uint8_t* restrict quadrature_permutation);
+      const uint8_t* restrict quadrature_permutation,
+      void* user_data);
 
   /// Tabulate integral into tensor A with compiled
   /// quadrature rule and double precision
@@ -100,7 +104,8 @@ extern "C"
       double* restrict A, const double* restrict w, const double* restrict c,
       const double* restrict coordinate_dofs,
       const int* restrict entity_local_index,
-      const uint8_t* restrict quadrature_permutation);
+      const uint8_t* restrict quadrature_permutation,
+      void* user_data);
 
 #ifndef __STDC_NO_COMPLEX__
   /// Tabulate integral into tensor A with compiled
@@ -111,7 +116,8 @@ extern "C"
       float _Complex* restrict A, const float _Complex* restrict w,
       const float _Complex* restrict c, const float* restrict coordinate_dofs,
       const int* restrict entity_local_index,
-      const uint8_t* restrict quadrature_permutation);
+      const uint8_t* restrict quadrature_permutation,
+      void* user_data);
 #endif // __STDC_NO_COMPLEX__
 
 #ifndef __STDC_NO_COMPLEX__
@@ -123,7 +129,8 @@ extern "C"
       double _Complex* restrict A, const double _Complex* restrict w,
       const double _Complex* restrict c, const double* restrict coordinate_dofs,
       const int* restrict entity_local_index,
-      const uint8_t* restrict quadrature_permutation);
+      const uint8_t* restrict quadrature_permutation,
+      void* user_data);
 #endif // __STDC_NO_COMPLEX__
 
   typedef struct ufcx_integral
diff --git a/ffcx/codegeneration/utils.py b/ffcx/codegeneration/utils.py
index bc0226e8f..4f4573c95 100644
--- a/ffcx/codegeneration/utils.py
+++ b/ffcx/codegeneration/utils.py
@@ -80,6 +80,7 @@ def numba_ufcx_kernel_signature(dtype: npt.DTypeLike, xdtype: npt.DTypeLike):
             types.CPointer(from_dtype(xdtype)),
             types.CPointer(types.intc),
             types.CPointer(types.uint8),
+            types.CPointer(types.void),
         )
     except ImportError as e:
         raise e
diff --git a/test/test_add_mode.py b/test/test_add_mode.py
index 574b02946..f57fde78b 100644
--- a/test/test_add_mode.py
+++ b/test/test_add_mode.py
@@ -86,6 +86,7 @@ def test_additive_facet_integral(dtype, compile_args):
             ffi.cast(f"{c_xtype} *", coords.ctypes.data),
             ffi.cast("int *", facets.ctypes.data),
             ffi.cast("uint8_t *", perm.ctypes.data),
+            ffi.NULL,
         )
         assert np.isclose(A.sum(), np.sqrt(12) * (i + 1))
 
@@ -158,6 +159,7 @@ def test_additive_cell_integral(dtype, compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     A0 = np.array(A)
@@ -169,6 +171,7 @@ def test_additive_cell_integral(dtype, compile_args):
             ffi.cast(f"{c_xtype} *", coords.ctypes.data),
             ffi.NULL,
             ffi.NULL,
+            ffi.NULL,
         )
 
         assert np.all(np.isclose(A, (i + 2) * A0))
diff --git a/test/test_jit_expression.py b/test/test_jit_expression.py
index bcc489654..64e00b65c 100644
--- a/test/test_jit_expression.py
+++ b/test/test_jit_expression.py
@@ -64,6 +64,7 @@ def test_matvec(compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.cast("int *", entity_index.ctypes.data),
         ffi.cast("uint8_t *", quad_perm.ctypes.data),
+        ffi.NULL,
     )
 
     # Check the computation against correct NumPy value
@@ -133,6 +134,7 @@ def test_rank1(compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.cast("int *", entity_index.ctypes.data),
         ffi.cast("uint8_t *", quad_perm.ctypes.data),
+        ffi.NULL,
     )
 
     f = np.array([[1.0, 2.0, 3.0], [-4.0, -5.0, 6.0]])
@@ -203,6 +205,7 @@ def test_elimiate_zero_tables_tensor(compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.cast("int *", entity_index.ctypes.data),
         ffi.cast("uint8_t *", quad_perm.ctypes.data),
+        ffi.NULL,
     )
 
     def exact_expr(x):
@@ -261,6 +264,7 @@ def test_grad_constant(compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.cast("int *", entity_index.ctypes.data),
         ffi.cast("uint8_t *", quad_perm.ctypes.data),
+        ffi.NULL,  
     )
 
     assert output[0] == pytest.approx(consts[1] * 2 * points[0, 0])
@@ -316,6 +320,7 @@ def test_facet_expression(compile_args):
             ffi.cast(f"{c_xtype} *", coords.ctypes.data),
             ffi.cast("int *", entity_index.ctypes.data),
             ffi.cast("uint8_t *", quad_perm.ctypes.data),
+            ffi.NULL,
         )
         # Assert that facet normal is perpendicular to tangent
         assert np.isclose(np.dot(output, tangent), 0)
@@ -366,6 +371,7 @@ def check_expression(expression_class, output_shape, entity_values, reference_va
                 ffi_data["coords"],
                 ffi_data["entity_index"],
                 ffi_data["quad_perm"],
+                ffi.NULL,
             )
             np.testing.assert_allclose(output, ref_val)
 
@@ -430,5 +436,6 @@ def test_facet_geometry_expressions_3D(compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.cast("int *", entity_index.ctypes.data),
         ffi.cast("uint8_t *", quad_perm.ctypes.data),
+        ffi.NULL,
     )
     np.testing.assert_allclose(output, np.asarray(ref_fev)[:3, :])
diff --git a/test/test_jit_forms.py b/test/test_jit_forms.py
index ef49313fe..1a8c9ae31 100644
--- a/test/test_jit_forms.py
+++ b/test/test_jit_forms.py
@@ -89,6 +89,7 @@ def test_laplace_bilinear_form_2d(dtype, expected_result, compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     assert np.allclose(A, np.trace(kappa_value) * expected_result)
@@ -233,6 +234,7 @@ def test_helmholtz_form_2d(dtype, expected_result, compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     np.testing.assert_allclose(A, expected_result)
@@ -305,6 +307,7 @@ def test_laplace_bilinear_form_3d(dtype, expected_result, compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     assert np.allclose(A, expected_result)
@@ -342,6 +345,7 @@ def test_form_coefficient(compile_args):
         ffi.cast("double  *", coords.ctypes.data),
         ffi.NULL,
         ffi.cast("uint8_t *", perm.ctypes.data),
+        ffi.NULL,
     )
 
     A_analytic = np.array([[2, 1, 1], [1, 2, 1], [1, 1, 2]], dtype=np.float64) / 24.0
@@ -452,6 +456,7 @@ def test_interior_facet_integral(dtype, compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.cast("int *", facets.ctypes.data),
         ffi.cast("uint8_t *", perms.ctypes.data),
+        ffi.NULL,
     )
 
 
@@ -512,6 +517,7 @@ def test_conditional(dtype, compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     expected_result = np.array([[2, -1, -1], [-1, 1, 0], [-1, 0, 1]], dtype=dtype)
@@ -530,6 +536,7 @@ def test_conditional(dtype, compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     expected_result = np.ones(3, dtype=dtype)
@@ -581,6 +588,7 @@ def test_custom_quadrature(compile_args):
         ffi.cast("double *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     # Check that A is diagonal
@@ -690,6 +698,7 @@ def test_lagrange_triangle(compile_args, order, dtype, sym_fun, ufl_fun):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     # Check that the result is the same as for sympy
@@ -817,6 +826,7 @@ def test_lagrange_tetrahedron(compile_args, order, dtype, sym_fun, ufl_fun):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     # Check that the result is the same as for sympy
@@ -852,6 +862,7 @@ def test_prism(compile_args):
         ffi.cast("double *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     assert np.isclose(sum(b), 0.5)
@@ -898,6 +909,7 @@ def test_complex_operations(compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     expected_result = np.array(
@@ -918,6 +930,7 @@ def test_complex_operations(compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     assert np.allclose(J_2, expected_result)
@@ -980,6 +993,7 @@ def test_interval_vertex_quadrature(compile_args):
         ffi.cast("double *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
     assert np.isclose(J[0], (0.5 * a + 0.5 * b) * np.abs(b - a))
 
@@ -1033,6 +1047,7 @@ def test_facet_vertex_quadrature(compile_args):
             ffi.cast("double *", coords.ctypes.data),
             ffi.cast("int *", facets.ctypes.data),
             ffi.NULL,
+            ffi.NULL,
         )
         solutions.append(J[0])
         # Test against exact result
@@ -1084,6 +1099,7 @@ def test_manifold_derivatives(compile_args):
         ffi.cast("double  *", coords.ctypes.data),
         ffi.NULL,
         ffi.cast("uint8_t *", perm.ctypes.data),
+        ffi.NULL,
     )
 
     assert np.isclose(J[0], 0.0)
@@ -1186,6 +1202,7 @@ def tabulate_tensor(ele_type, V_cell_type, W_cell_type, coeffs):
             ffi.cast(f"{c_xtype} *", coords.ctypes.data),
             ffi.cast("int *", facet.ctypes.data),
             ffi.cast("uint8_t *", perm.ctypes.data),
+            ffi.NULL,
         )
 
         return A
diff --git a/test/test_submesh.py b/test/test_submesh.py
index 0379fbd13..5573ec4fa 100644
--- a/test/test_submesh.py
+++ b/test/test_submesh.py
@@ -49,6 +49,7 @@ def compute_tensor(forms: list[ufl.form.Form], dtype: str, compile_args: list[st
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
     return A
 
diff --git a/test/test_tensor_product.py b/test/test_tensor_product.py
index a5ef2a370..f0c81206a 100644
--- a/test/test_tensor_product.py
+++ b/test/test_tensor_product.py
@@ -110,6 +110,7 @@ def test_bilinear_form(dtype, P, cell_type):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     # Use sum factorization
@@ -125,6 +126,7 @@ def test_bilinear_form(dtype, P, cell_type):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.NULL,
         ffi.NULL,
+        ffi.NULL,
     )
 
     np.testing.assert_allclose(A, A1, rtol=1e-6, atol=1e-6)

From 11cb033649448fff96f006d180d33719413d6f80 Mon Sep 17 00:00:00 2001
From: Claus Susanne <sclaus@Clauss-MacBook-Pro.local>
Date: Wed, 19 Feb 2025 15:38:03 +0100
Subject: [PATCH 02/10] try to trigger CI

---
 .github/workflows/pythonapp.yml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.github/workflows/pythonapp.yml b/.github/workflows/pythonapp.yml
index 4d6b91eed..761e76a59 100644
--- a/.github/workflows/pythonapp.yml
+++ b/.github/workflows/pythonapp.yml
@@ -8,6 +8,7 @@ on:
   push:
     branches:
       - "**"
+      - sclaus/add-void-to-kernels
     tags:
       - "v*"
   pull_request:

From bb4e90a864cdd4e82a2f4b56d160604c60193196 Mon Sep 17 00:00:00 2001
From: Claus Susanne <sclaus@Clauss-MacBook-Pro.local>
Date: Wed, 19 Feb 2025 15:44:34 +0100
Subject: [PATCH 03/10] try to trigger CI

---
 .github/workflows/pythonapp.yml | 1 -
 1 file changed, 1 deletion(-)

diff --git a/.github/workflows/pythonapp.yml b/.github/workflows/pythonapp.yml
index 761e76a59..4d6b91eed 100644
--- a/.github/workflows/pythonapp.yml
+++ b/.github/workflows/pythonapp.yml
@@ -8,7 +8,6 @@ on:
   push:
     branches:
       - "**"
-      - sclaus/add-void-to-kernels
     tags:
       - "v*"
   pull_request:

From 49b23a0c80ccaaf07fc807ee18903b361a3f8c58 Mon Sep 17 00:00:00 2001
From: Claus Susanne <sclaus@Clauss-MacBook-Pro.local>
Date: Wed, 19 Feb 2025 15:53:46 +0100
Subject: [PATCH 04/10] run ruff

---
 test/test_jit_expression.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/test/test_jit_expression.py b/test/test_jit_expression.py
index 64e00b65c..8261caf77 100644
--- a/test/test_jit_expression.py
+++ b/test/test_jit_expression.py
@@ -264,7 +264,7 @@ def test_grad_constant(compile_args):
         ffi.cast(f"{c_xtype} *", coords.ctypes.data),
         ffi.cast("int *", entity_index.ctypes.data),
         ffi.cast("uint8_t *", quad_perm.ctypes.data),
-        ffi.NULL,  
+        ffi.NULL,
     )
 
     assert output[0] == pytest.approx(consts[1] * 2 * points[0, 0])

From bb022ad0b961fd3e8075d0730b0f1ce46c65607f Mon Sep 17 00:00:00 2001
From: Claus Susanne <sclaus@Clauss-MacBook-Pro.local>
Date: Wed, 19 Feb 2025 17:06:00 +0100
Subject: [PATCH 05/10] rename user_data custom_data

---
 ffcx/codegeneration/C/expressions_template.py |  2 +-
 ffcx/codegeneration/C/integrals_template.py   |  2 +-
 ffcx/codegeneration/ufcx.h                    | 10 +++++-----
 3 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/ffcx/codegeneration/C/expressions_template.py b/ffcx/codegeneration/C/expressions_template.py
index dc0a0574b..da439cfaf 100644
--- a/ffcx/codegeneration/C/expressions_template.py
+++ b/ffcx/codegeneration/C/expressions_template.py
@@ -24,7 +24,7 @@
                                     const {geom_type}* restrict coordinate_dofs,
                                     const int* restrict entity_local_index,
                                     const uint8_t* restrict quadrature_permutation,
-                                    void* user_data)
+                                    void* custom_data)
 {{
 {tabulate_expression}
 }}
diff --git a/ffcx/codegeneration/C/integrals_template.py b/ffcx/codegeneration/C/integrals_template.py
index 407ed7a96..54d3a593b 100644
--- a/ffcx/codegeneration/C/integrals_template.py
+++ b/ffcx/codegeneration/C/integrals_template.py
@@ -17,7 +17,7 @@
                                     const {geom_type}* restrict coordinate_dofs,
                                     const int* restrict entity_local_index,
                                     const uint8_t* restrict quadrature_permutation,
-                                    void* user_data)
+                                    void* custom_data)
 {{
 {tabulate_tensor}
 }}
diff --git a/ffcx/codegeneration/ufcx.h b/ffcx/codegeneration/ufcx.h
index b768bb8cd..dd5137102 100644
--- a/ffcx/codegeneration/ufcx.h
+++ b/ffcx/codegeneration/ufcx.h
@@ -86,7 +86,7 @@ extern "C"
   /// For integrals not on interior facets, this argument has no effect and a
   /// null pointer can be passed. For interior facets the array will have size 2
   /// (one permutation for each cell adjacent to the facet).
-  /// @param[in] user_data Custom user data passed to the tabulate function. 
+  /// @param[in] custom_data Custom user data passed to the tabulate function. 
   /// For example, a struct with additional data needed for the tabulate function.
   /// See the implementation of runtime integrals for further details.
   typedef void(ufcx_tabulate_tensor_float32)(
@@ -94,7 +94,7 @@ extern "C"
       const float* restrict coordinate_dofs,
       const int* restrict entity_local_index,
       const uint8_t* restrict quadrature_permutation,
-      void* user_data);
+      void* custom_data);
 
   /// Tabulate integral into tensor A with compiled
   /// quadrature rule and double precision
@@ -105,7 +105,7 @@ extern "C"
       const double* restrict coordinate_dofs,
       const int* restrict entity_local_index,
       const uint8_t* restrict quadrature_permutation,
-      void* user_data);
+      void* custom_data);
 
 #ifndef __STDC_NO_COMPLEX__
   /// Tabulate integral into tensor A with compiled
@@ -117,7 +117,7 @@ extern "C"
       const float _Complex* restrict c, const float* restrict coordinate_dofs,
       const int* restrict entity_local_index,
       const uint8_t* restrict quadrature_permutation,
-      void* user_data);
+      void* custom_data);
 #endif // __STDC_NO_COMPLEX__
 
 #ifndef __STDC_NO_COMPLEX__
@@ -130,7 +130,7 @@ extern "C"
       const double _Complex* restrict c, const double* restrict coordinate_dofs,
       const int* restrict entity_local_index,
       const uint8_t* restrict quadrature_permutation,
-      void* user_data);
+      void* custom_data);
 #endif // __STDC_NO_COMPLEX__
 
   typedef struct ufcx_integral

From 9ab688c1042f12956ec8e88faa615fc12dfb2604 Mon Sep 17 00:00:00 2001
From: Claus Susanne <sclaus@Clauss-MacBook-Pro.local>
Date: Sat, 22 Feb 2025 01:18:07 +0100
Subject: [PATCH 06/10] add numba functions to obtain empty void* and
 conversion of numpy array to void*

---
 ffcx/codegeneration/utils.py | 54 ++++++++++++++++++++++++++++++++++++
 1 file changed, 54 insertions(+)

diff --git a/ffcx/codegeneration/utils.py b/ffcx/codegeneration/utils.py
index 4f4573c95..1b93887a6 100644
--- a/ffcx/codegeneration/utils.py
+++ b/ffcx/codegeneration/utils.py
@@ -10,6 +10,11 @@
 import numpy as np
 import numpy.typing as npt
 
+try:
+    import numba
+except ImportError:
+    numba = None
+
 
 def dtype_to_c_type(dtype: typing.Union[npt.DTypeLike, str]) -> str:
     """For a NumPy dtype, return the corresponding C type.
@@ -84,3 +89,52 @@ def numba_ufcx_kernel_signature(dtype: npt.DTypeLike, xdtype: npt.DTypeLike):
         )
     except ImportError as e:
         raise e
+
+
+if numba is not None:
+
+    @numba.extending.intrinsic
+    def empty_void_pointer(typingctx):
+        """Custom intrinsic to return an empty void* pointer.
+        This function creates a void pointer initialized to null (0).
+        This is used to pass a nullptr to the UFCx tabulate_tensor interface.
+        Args:
+            typingctx: The typing context.
+
+        Returns:
+            A Numba signature and a code generation function that returns a void pointer.
+        """  # noqa: D205
+
+        def codegen(context, builder, signature, args):
+            null_ptr = context.get_constant(numba.types.voidptr, 0)
+            return null_ptr
+
+        sig = numba.types.voidptr()
+        return sig, codegen
+
+    @numba.extending.intrinsic
+    def get_void_pointer(typingctx, arr):
+        """Custom intrinsic to get a void* pointer from a NumPy array.
+
+        This function takes a NumPy array and returns a void pointer to the array's data.
+        This is used to pass custom data organised in a NumPy array
+        to the UFCx tabulate_tensor interface.
+
+        Args:
+            typingctx: The typing context.
+            arr: The NumPy array to get the void pointer from.
+
+        Returns:
+            A Numba signature and a code generation function that returns a void pointer to the array's data.
+        """
+        if not isinstance(arr, numba.types.Array):
+            raise TypeError("Expected a NumPy array")
+
+        def codegen(context, builder, signature, args):
+            [arr] = args
+            raw_ptr = numba.core.cgutils.alloca_once_value(builder, arr)
+            void_ptr = builder.bitcast(raw_ptr, context.get_value_type(numba.types.voidptr))
+            return void_ptr
+
+        sig = numba.types.voidptr(arr)
+        return sig, codegen

From 52104cbf0b3ba3656313d086629b65da7863ebcb Mon Sep 17 00:00:00 2001
From: Claus Susanne <sclaus@Clauss-MacBook-Pro.local>
Date: Sat, 22 Feb 2025 09:09:29 +0100
Subject: [PATCH 07/10] fix ruff check

---
 ffcx/codegeneration/utils.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/ffcx/codegeneration/utils.py b/ffcx/codegeneration/utils.py
index 1b93887a6..8632044a6 100644
--- a/ffcx/codegeneration/utils.py
+++ b/ffcx/codegeneration/utils.py
@@ -98,6 +98,7 @@ def empty_void_pointer(typingctx):
         """Custom intrinsic to return an empty void* pointer.
         This function creates a void pointer initialized to null (0).
         This is used to pass a nullptr to the UFCx tabulate_tensor interface.
+
         Args:
             typingctx: The typing context.
 
@@ -125,7 +126,8 @@ def get_void_pointer(typingctx, arr):
             arr: The NumPy array to get the void pointer from.
 
         Returns:
-            A Numba signature and a code generation function that returns a void pointer to the array's data.
+            A Numba signature and a code generation function that returns a void pointer
+            to the array's data.
         """
         if not isinstance(arr, numba.types.Array):
             raise TypeError("Expected a NumPy array")

From 7beaeef27fbe93c362094e9b67a26ec6cf4a6df0 Mon Sep 17 00:00:00 2001
From: Claus Susanne <sclaus@Clauss-MacBook-Pro.local>
Date: Sat, 22 Feb 2025 09:23:53 +0100
Subject: [PATCH 08/10] add line to remove noqa

---
 ffcx/codegeneration/utils.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/ffcx/codegeneration/utils.py b/ffcx/codegeneration/utils.py
index 8632044a6..871f80390 100644
--- a/ffcx/codegeneration/utils.py
+++ b/ffcx/codegeneration/utils.py
@@ -96,6 +96,7 @@ def numba_ufcx_kernel_signature(dtype: npt.DTypeLike, xdtype: npt.DTypeLike):
     @numba.extending.intrinsic
     def empty_void_pointer(typingctx):
         """Custom intrinsic to return an empty void* pointer.
+
         This function creates a void pointer initialized to null (0).
         This is used to pass a nullptr to the UFCx tabulate_tensor interface.
 
@@ -104,7 +105,7 @@ def empty_void_pointer(typingctx):
 
         Returns:
             A Numba signature and a code generation function that returns a void pointer.
-        """  # noqa: D205
+        """
 
         def codegen(context, builder, signature, args):
             null_ptr = context.get_constant(numba.types.voidptr, 0)

From abe2391c5d0bc2310c5bf91f80fb15dd0ee85da0 Mon Sep 17 00:00:00 2001
From: Claus Susanne <sclaus@Clauss-MacBook-Pro.local>
Date: Thu, 6 Mar 2025 17:49:29 +0100
Subject: [PATCH 09/10] expand comment for numba intrinsic function

---
 ffcx/codegeneration/utils.py | 22 +++++++++++++++++++++-
 1 file changed, 21 insertions(+), 1 deletion(-)

diff --git a/ffcx/codegeneration/utils.py b/ffcx/codegeneration/utils.py
index 871f80390..99b031fb0 100644
--- a/ffcx/codegeneration/utils.py
+++ b/ffcx/codegeneration/utils.py
@@ -125,15 +125,35 @@ def get_void_pointer(typingctx, arr):
         Args:
             typingctx: The typing context.
             arr: The NumPy array to get the void pointer from.
+            In a multi-dimensional NumPy array, the memory is laid out in a contiguous
+            block of memory in either row-major (C-style) or
+            column-major (Fortran-style) order.
+            By default, NumPy uses row-major order.
 
         Returns:
             A Numba signature and a code generation function that returns a void pointer
-            to the array's data.
+            to the first element of the contiguous block of memory that stores the array's
+            data in row-major order by default.
         """
         if not isinstance(arr, numba.types.Array):
             raise TypeError("Expected a NumPy array")
 
         def codegen(context, builder, signature, args):
+            """Generate LLVM IR code to convert a NumPy array to a void* pointer.
+
+            This function generates the necessary LLVM IR instructions to:
+            1. Allocate memory for the array on the stack.
+            2. Cast the allocated memory to a void* pointer.
+
+            Args:
+                context: The LLVM context.
+                builder: The LLVM IR builder.
+                signature: The function signature.
+                args: The input arguments (NumPy array).
+
+            Returns:
+                A void* pointer to the array's data.
+            """
             [arr] = args
             raw_ptr = numba.core.cgutils.alloca_once_value(builder, arr)
             void_ptr = builder.bitcast(raw_ptr, context.get_value_type(numba.types.voidptr))

From 7914fbe5a6e031b185b7feac8e1d50d82ee2982f Mon Sep 17 00:00:00 2001
From: Claus Susanne <sclaus@Clauss-MacBook-Pro.local>
Date: Fri, 7 Mar 2025 16:30:18 +0100
Subject: [PATCH 10/10] add test to use a struct in C-function similar to
 tabulate_tensor using void*

---
 test/test_custom_data.py | 114 +++++++++++++++++++++++++++++++++++++++
 1 file changed, 114 insertions(+)
 create mode 100644 test/test_custom_data.py

diff --git a/test/test_custom_data.py b/test/test_custom_data.py
new file mode 100644
index 000000000..1107fb652
--- /dev/null
+++ b/test/test_custom_data.py
@@ -0,0 +1,114 @@
+# Copyright (C) 2024 Susanne Claus
+#
+# This file is part of FFCx. (https://www.fenicsproject.org)
+#
+# SPDX-License-Identifier:    LGPL-3.0-or-later
+
+import numpy as np
+from cffi import FFI
+
+# Define custom tabulate tensor function in C with a struct
+# Step 1: Define the function in C and set up the CFFI builder
+ffibuilder = FFI()
+ffibuilder.set_source(
+    "_cffi_kernelA",
+    r"""
+    typedef struct {
+        uint8_t size;
+        double* values;
+    } cell_data;
+
+    void tabulate_tensor_integral_add_values(double* restrict A,
+                                            const double* restrict w,
+                                            const double* restrict c,
+                                            const double* restrict coordinate_dofs,
+                                            const int* restrict entity_local_index,
+                                            const uint8_t* restrict quadrature_permutation,
+                                            void* custom_data)
+    {
+        // Cast the void* custom_data to cell_data*
+        cell_data* custom_data_ptr = (cell_data*)custom_data;
+
+        // Access the custom data
+        uint8_t size = custom_data_ptr->size;
+        double* values = custom_data_ptr->values;
+
+        // Use the values in your computations
+        for (uint8_t i = 0; i < size; i++) {
+            A[0] += values[i];
+        }
+    }
+    """,
+)
+ffibuilder.cdef(
+    """
+    typedef struct {
+        uint8_t size;
+        double* values;
+    } cell_data;
+
+    void tabulate_tensor_integral_add_values(double* restrict A,
+                                            const double* restrict w,
+                                            const double* restrict c,
+                                            const double* restrict coordinate_dofs,
+                                            const int* restrict entity_local_index,
+                                            const uint8_t* restrict quadrature_permutation,
+                                            void* custom_data);
+    """
+)
+
+# Step 2: Compile the C code
+ffibuilder.compile(verbose=True)
+
+
+def test_tabulate_tensor_integral_add_values():
+    # Step 3: Import the compiled library
+    from _cffi_kernelA import ffi, lib
+
+    # Define cell data
+    size = 2
+    values = np.array([2.0, 1.0], dtype=np.float64)
+    expected_result = np.array([3.0], dtype=np.float64)
+
+    # Define the input arguments
+    A = np.zeros(1, dtype=np.float64)
+    w = np.array([1.0], dtype=np.float64)
+    c = np.array([0.0], dtype=np.float64)
+    coordinate_dofs = np.array(
+        [0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0], dtype=np.float64
+    )
+    entity_local_index = np.array([0], dtype=np.int32)
+    quadrature_permutation = np.array([0], dtype=np.uint8)
+
+    # Cast the arguments to the appropriate C types
+    A_ptr = ffi.cast("double*", A.ctypes.data)
+    w_ptr = ffi.cast("double*", w.ctypes.data)
+    c_ptr = ffi.cast("double*", c.ctypes.data)
+    coordinate_dofs_ptr = ffi.cast("double*", coordinate_dofs.ctypes.data)
+    entity_local_index_ptr = ffi.cast("int*", entity_local_index.ctypes.data)
+    quadrature_permutation_ptr = ffi.cast("uint8_t*", quadrature_permutation.ctypes.data)
+
+    # Use ffi.from_buffer to create a CFFI pointer from the NumPy array
+    values_ptr = ffi.from_buffer(values)
+
+    # Allocate memory for the struct
+    custom_data = ffi.new("cell_data*")
+    custom_data.size = size
+    custom_data.values = values_ptr
+
+    # Cast the struct to void*
+    custom_data_ptr = ffi.cast("void*", custom_data)
+
+    # Call the function
+    lib.tabulate_tensor_integral_add_values(
+        A_ptr,
+        w_ptr,
+        c_ptr,
+        coordinate_dofs_ptr,
+        entity_local_index_ptr,
+        quadrature_permutation_ptr,
+        custom_data_ptr,
+    )
+
+    # Assert the result
+    np.testing.assert_allclose(A, expected_result, rtol=1e-5)