Merge pull request #1059 from Antoinemarteau/master

JordiManyer · web-flow · commit 900979650caa · 2024-12-02T09:32:08.000+11:00
optimized MonomialBases evaluations
diff --git a/NEWS.md b/NEWS.md
@@ -17,6 +17,9 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 - Fixed #974, an error when weak form is real but unknown vector is complex. Since PR[#1050](https://github.com/gridap/Gridap.jl/pull/1050).
 - Fixed issue where barycentric refinement rule in 3D would not produce oriented meshes. Since PR[#1055](https://github.com/gridap/Gridap.jl/pull/1055).
 
+### Changed
+- Optimized MonomialBasis low-level functions. Since PR[#1059](https://github.com/gridap/Gridap.jl/pull/1059).
+
 ## [0.18.7] - 2024-10-8
 
 ### Added
diff --git a/benchmark/Project.toml b/benchmark/Project.toml
@@ -2,3 +2,4 @@
 BenchmarkTools = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf"
 Gridap = "56d4f2e9-7ea1-5844-9cf6-b9c51ca7ce8e"
 PkgBenchmark = "32113eaa-f34f-5b0d-bd6c-c81e245fc73d"
+StaticArrays = "90137ffa-7385-5640-81b9-e52037218182"
diff --git a/benchmark/benchmarks.jl b/benchmark/benchmarks.jl
@@ -12,3 +12,4 @@ end
 const SUITE = BenchmarkGroup()
 
 @include_bm SUITE "bm_assembly"
+@include_bm SUITE "bm_monomial_basis"
diff --git a/benchmark/bm/bm_monomial_basis.jl b/benchmark/bm/bm_monomial_basis.jl
@@ -0,0 +1,190 @@
+module bm_monomial_basis
+
+using PkgBenchmark, BenchmarkTools
+using Gridap
+using Gridap.Polynomials
+using Gridap.TensorValues
+using StaticArrays
+
+################################################
+# src/Polynomials/MonomialBases.jl: _set_value!
+################################################
+
+gradient_type = Gridap.Fields.gradient_type
+
+_set_value! = Gridap.Polynomials._set_value!
+
+function set_value_driver(f,T,D,x,n)
+  k = 1
+  s = one(T)
+  for i in 1:n
+    k = f(x,s,k)
+  end
+end
+
+function set_value_benchmarkable(D, T, V, n)
+  C = num_indep_components(V)
+  x = zeros(V,n*C)
+  return @benchmarkable set_value_driver($_set_value!,$T,$D,$x,$n)
+end
+
+##################################################
+# src/Polynomials/ModalC0Bases.jl: _set_value_mc0!
+##################################################
+
+_set_value_mc0! = Gridap.Polynomials._set_value_mc0!
+
+function set_value_mc0_driver(f,T,D,x,n)
+  k = 1
+  s = one(T)
+  for i in 1:n
+    k = f(x,s,k,2)
+  end
+end
+
+function set_value_mc0_benchmarkable(D, T, V, n)
+  C = num_indep_components(V)
+  x = zeros(V,2*n*C)
+  return @benchmarkable set_value_mc0_driver($_set_value_mc0!,$T,$D,$x,$n)
+end
+
+###################################################
+# src/Polynomials/MonomialBases.jl: _set_gradient!
+###################################################
+
+ _set_gradient! = Gridap.Polynomials. _set_gradient!
+
+function set_gradient_driver(f,T,D,V,x,n)
+  k = 1
+  s = VectorValue{D,T}(ntuple(_->one(T),D))
+  for i in 1:n
+    k = f(x,s,k,V)
+  end
+end
+
+function set_gradient_benchmarkable(D, T, V, n)
+  C = num_indep_components(V)
+  G = gradient_type(V, zero(Point{D,T}))
+  x = zeros(G,n*C);
+  return @benchmarkable set_gradient_driver($_set_gradient!,$T,$D,$V,$x,$n)
+end
+
+#####################################################
+# src/Polynomials/ModalC0Bases.jl: _set_gradient_mc0!
+#####################################################
+
+ _set_gradient_mc0! = Gridap.Polynomials. _set_gradient_mc0!
+
+function set_gradient_mc0_driver(f,T,D,V,x,n)
+  k = 1
+  s = VectorValue{D,T}(ntuple(_->one(T),D))
+  for i in 1:n
+    k = f(x,s,k,1,V)
+  end
+end
+
+function set_gradient_mc0_benchmarkable(D, T, V, n)
+  C = num_indep_components(V)
+  G = gradient_type(V, zero(Point{D,T}))
+  x = zeros(G,n*C);
+  return @benchmarkable set_gradient_mc0_driver($_set_gradient_mc0!,$T,$D,$V,$x,$n)
+end
+
+#################################################
+# src/Polynomials/MonomialBases.jl: _evaluate_1d!
+#################################################
+
+_evaluate_1d! = Gridap.Polynomials._evaluate_1d!
+
+function evaluate_1d_driver(f,order,D,v,x_vec)
+  for x in x_vec
+    f(v,x,order,D)
+  end
+end
+
+function evaluate_1d_benchmarkable(D, T, V, n)
+  n = Integer(n/50)
+  order = num_indep_components(V)
+  v = zeros(D,order+1);
+  x = rand(MVector{n,T})
+  return @benchmarkable evaluate_1d_driver($_evaluate_1d!,$order,$D,$v,$x)
+end
+
+################################################
+# src/Polynomials/MonomialBases.jl: _gradient_1d!
+################################################
+
+_gradient_1d! = Gridap.Polynomials._gradient_1d!
+
+function gradient_1d_driver(f,order,D,v,x_vec)
+  for x in x_vec
+    f(v,x,order,D)
+  end
+end
+
+function gradient_1d_benchmarkable(D, T, V, n)
+  n = Integer(n/10)
+  order = num_indep_components(V)
+  v = zeros(D,order+1);
+  x = rand(MVector{n,T})
+  return @benchmarkable gradient_1d_driver($_gradient_1d!,$order,$D,$v,$x)
+end
+
+################################################
+# src/Polynomials/MonomialBases.jl: _hessian_1d!
+################################################
+
+_hessian_1d! = Gridap.Polynomials._hessian_1d!
+
+function hessian_1d_driver(f,order,D,v,x_vec)
+  for x in x_vec
+    f(v,x,order,D)
+  end
+end
+
+function hessian_1d_benchmarkable(D, T, V, n)
+  n = Integer(n/10)
+  order = num_indep_components(V)
+  v = zeros(D,order+1);
+  x = rand(MVector{n,T})
+  return @benchmarkable hessian_1d_driver($_hessian_1d!,$order,$D,$v,$x)
+end
+
+#####################
+# benchmarkable suite
+#####################
+
+const SUITE = BenchmarkGroup()
+
+const benchmarkables = (
+  set_value_benchmarkable,
+  set_value_mc0_benchmarkable,
+  set_gradient_benchmarkable,
+  set_gradient_mc0_benchmarkable,
+  evaluate_1d_benchmarkable,
+  gradient_1d_benchmarkable,
+  hessian_1d_benchmarkable
+)
+
+const dims=(1, 2, 3, 5, 8)
+const n = 3000
+const T = Float64
+
+for benchable in benchmarkables
+  for D in dims
+    TV = [
+      VectorValue{D,T},
+      TensorValue{D,D,T,D*D},
+      SymTensorValue{D,T,Integer(D*(D+1)/2)},
+      SymTracelessTensorValue{D,T,Integer(D*(D+1)/2)}
+    ]
+
+    for V in TV
+      if V == SymTracelessTensorValue{1,T,1} continue end # no dofs
+      name = "monomial_basis_$(D)D_$(V)_$(benchable)"
+      SUITE[name] = benchable(D, T, V, n)
+    end
+  end
+end
+
+end # module
diff --git a/src/Polynomials/ModalC0Bases.jl b/src/Polynomials/ModalC0Bases.jl
@@ -393,16 +393,10 @@ end
 
 @inline function _set_value_mc0!(v::AbstractVector{V},s::T,k,l) where {V,T}
   ncomp = num_indep_components(V)
-  m = zero(MVector{ncomp,T})
   z = zero(T)
-  js = 1:ncomp
-  for j in js
-    for i in js
-      @inbounds m[i] = z
-    end
-    @inbounds m[j] = s
-    i = k+l*(j-1)
-    @inbounds v[i] = Tuple(m)
+  for j in 1:ncomp
+    m = k+l*(j-1)
+    @inbounds v[m] = ntuple(i -> ifelse(i == j, s, z),Val(ncomp))
   end
   k+1
 end
@@ -466,25 +460,36 @@ end
 # Indexing and m definition should be fixed if G contains symmetries, that is
 # if the code is  optimized for symmetric tensor V valued FESpaces
 # (if gradient_type(V) returned a symmetric higher order tensor type G)
-@inline function _set_gradient_mc0!(
+@inline @generated function _set_gradient_mc0!(
   v::AbstractVector{G},s,k,l,::Type{V}) where {V,G}
+  # See this function's git history (git blame) for the readable, non-generated version
   @notimplementedif num_indep_components(G) != num_components(G) "Not implemented for symmetric Jacobian or Hessian"
-
-  T = eltype(s)
-  m = zero(Mutable(G))
-  w = zero(V)
-  z = zero(T)
-  for (ij,j) in enumerate(CartesianIndices(w))
+  
+  m = Array{String}(undef, size(G))
+  N_val_dims = length(size(V))
+  s_size = size(G)[1:end-N_val_dims]
+
+  body = "T = eltype(s); z = zero(T);"
+  for ci in CartesianIndices(s_size)
+    id = join(Tuple(ci))
+    body *= "@inbounds s$id = s[$ci];"
+  end
+  
+  V_size = size(V)
+  for (ij,j) in enumerate(CartesianIndices(V_size))
     for i in CartesianIndices(m)
-      @inbounds m[i] = z
+      m[i] = "z"
     end
-    for i in CartesianIndices(s)
-      @inbounds m[i,j] = s[i]
+    for ci in CartesianIndices(s_size)
+      id = join(Tuple(ci))
+      m[ci,j] = "s$id"
     end
-    i = k+l*(ij-1)
-    @inbounds v[i] = m
+    body *= "i = k + l*($ij-1);"
+    body *= "@inbounds v[i] = ($(join(tuple(m...), ", ")));"
   end
-  k+1
+
+  body = Meta.parse(string("begin ",body," end"))
+  return Expr(:block, body ,:(return k+1))
 end
 
 function _hessian_nd_mc0!(
diff --git a/src/Polynomials/MonomialBases.jl b/src/Polynomials/MonomialBases.jl

Original file line number	Diff line number	Diff line change
`@@ -12,3 +12,4 @@ end`
`12`	`12`	`const SUITE = BenchmarkGroup()`
`13`	`13`
`14`	`14`	`@include_bm SUITE "bm_assembly"`
	`15`	`+@include_bm SUITE "bm_monomial_basis"`