Fixed formatting errors and updated mesh coordinate transformation and operator setup

KartikiP · web-flow · commit 5c36feb8e1c3 · 2025-12-09T09:36:55.000-08:00
Fixed mesh transformation and operator application logic.
diff --git a/julia/LibCEED.jl/examples/ex3-volume.jl b/julia/LibCEED.jl/examples/ex3-volume.jl
@@ -1,180 +1,195 @@
 using LibCEED, Printf
 
-include("common.jl")
+include("common.jl")   # defines helper functions: create_tensor_h1_lagrange_basis,
+                       # build_cartesian_restriction, get_cartesian_mesh_size, etc.
 
 function transform_mesh_coords!(dim, mesh_size, mesh_coords)
-     @witharray coords = mesh_coords begin
+    @witharray coords = mesh_coords begin
         if dim == 1
             for i = 1:mesh_size
-                # map [0,1] to [0,1] varying the mesh density
                 coords[i] = 0.5 + 1.0/sqrt(3.0)*sin((2.0/3.0)*pi*(coords[i] - 0.5))
             end
             exact_volume = 1.0
         else
-            num_nodes = mesh_size÷dim
+            num_nodes = mesh_size ÷ dim  # coords holds all x values, then all y values
             @inbounds @simd for i = 1:num_nodes
-                # map (x,y) from [0,1]x[0,1] to the quarter annulus with polar
-                # coordinates, (r,phi) in [1,2]x[0,pi/2] with area = 3/4*pi
-                u = coords[i]
-                v = coords[i+num_nodes]
-                u = 1.0 + u
-                v = pi/2*v
-                coords[i] = u*cos(v)
-                coords[i+num_nodes] = u*sin(v)
+                u = coords[i]            # ξ ∈ [0,1]
+                v = coords[i+num_nodes]  # η ∈ [0,1]
+                r = 1.0 + u              # radius r ∈ [1,2]
+                θ = (pi/2) * v           # angle θ ∈ [0,π/2]
+                coords[i]           = r * cos(θ)  # x on the quarter annulus
+                coords[i+num_nodes] = r * sin(θ)  # y on the quarter annulus
             end
-            exact_volume = 3.0/4.0*pi
+            exact_volume = 3.0/4.0 * pi  # area of the quarter annulus 1 ≤ r ≤ 2
         end
         return exact_volume
     end
 end
 
-function run_ex3(; ceed_spec, dim, mesh_order, sol_order, num_qpts, prob_size, gallery)
-    # Main implementation goes here
-    ncompx = dim
+function run_ex3(; ceed_spec="/cpu/self", dim=2, mesh_order=3, sol_order=3,
+                 num_qpts=4, prob_size=-1, gallery=false)
+
     prob_size < 0 && (prob_size = 256*1024)
+    ncompx = dim
 
     ceed = Ceed(ceed_spec)
-    mesh_basis = 
-    create_tensor_h1_lagrange_basis(ceed, dim, ncompx, mesh_order + 1, num_qpts, GAUSS)
-    sol_basis = 
-    create_tensor_h1_lagrange_basis(ceed, dim, 1, sol_order + 1, num_qpts, GAUSS)
 
-    nxyz = get_cartesian_mesh_size(dim, sol_order, prob_size) 
-    println("Mesh size:",nxyz)
+    
+    # Bases
+    
+    mesh_basis = create_tensor_h1_lagrange_basis(ceed, dim, ncompx, mesh_order + 1, num_qpts, GAUSS)
+    sol_basis  = create_tensor_h1_lagrange_basis(ceed, dim, 1,       sol_order + 1,  num_qpts, GAUSS)
+
+  
+    # Mesh size & restrictions
+  
+    nxyz = get_cartesian_mesh_size(dim, sol_order, prob_size)
+    println("Mesh size: ", nxyz)
 
-    #Build CeedElemRestriction objects describing the mesh and solution discrete
-    # mesh_rstr: for building (no qdata restriction needed)
     mesh_size, mesh_rstr, _ = build_cartesian_restriction(ceed, dim, nxyz, mesh_order, ncompx, num_qpts)
 
-   # sol_rstr + sol_rstr_i: for solving
-    sol_size, sol_rstr, sol_rstr_i = build_cartesian_restriction(
-        ceed, dim, nxyz, sol_order, 1, num_qpts, mode=RestrictionAndStrided
-    )
+    sol_size, sol_rstr, _ = build_cartesian_restriction(
+        ceed, dim, nxyz, sol_order, 1, num_qpts, mode=RestrictionAndStrided)
+
+    # Physical mesh coordinates + exact volume
 
-   # mesh_coords
     mesh_coords = CeedVector(ceed, mesh_size)
     set_cartesian_mesh_coords!(dim, nxyz, mesh_order, mesh_coords)
     exact_vol = transform_mesh_coords!(dim, mesh_size, mesh_coords)
 
-    #Create the Q-function that builds the mass operator ( i.e it computes the quadrature data) and set its context data.
-    num_q_comp = 1 + div(dim*(dim+1), 2)
+  
+    num_q_comp = 1 + div(dim*(dim + 1), 2)   # 1 for detJ (mass), rest for symmetric JᵀJ
+    num_elem   = prod(nxyz)
+    elem_qpts  = num_qpts^dim
+
+    qdata_size = num_elem * elem_qpts * num_q_comp
+    qdata = CeedVector(ceed, qdata_size)
+    qdata[] = 0.0
+
+    # Strided restriction over qdata: one "node" per quadrature point, num_q_comp components
+    qdata_rstr = create_elem_restriction_strided(
+        ceed,
+        num_elem,
+        elem_qpts,          # nodes per element = quadrature points
+        num_q_comp,         # components per quadrature point
+        qdata_size,         # = num_elem * elem_qpts * num_q_comp, fully covered by the strides
+        CeedInt[1, elem_qpts, elem_qpts * num_q_comp]  # strides between [nodes, components, elements]
+    )
+
     
     @interior_qf build_qfunc = (
         ceed,
         dim=dim,
-        (dx, :in, EVAL_GRAD, dim, dim),      # ← THIS LINE: dx input
-        (weights, :in, EVAL_WEIGHT),         # ← weights input
-        (qdata, :out, EVAL_NONE, num_q_comp), # ← qdata output
+        (dx,      :in,  EVAL_GRAD,    dim, dim),
+        (weights, :in,  EVAL_WEIGHT),
+        (qdata,   :out, EVAL_NONE,   num_q_comp),
         begin
-            # Compute determinant
-            det_J = det(dx)
-            
-            # Store mass component
-            qdata[1] = weights * det_J
-            
-            # Store diffusion components (J^T * J)
-            idx = 2
+            # det(J)
+            if dim == 1
+                detJ = dx[1,1]
+            elseif dim == 2
+                detJ = dx[1,1]*dx[2,2] - dx[1,2]*dx[2,1]
+            else
+                detJ = (dx[1,1]*(dx[2,2]*dx[3,3] - dx[2,3]*dx[3,2]) -
+                        dx[1,2]*(dx[2,1]*dx[3,3] - dx[2,3]*dx[3,1]) +
+                        dx[1,3]*(dx[2,1]*dx[3,2] - dx[2,2]*dx[3,1]))
+            end
+
+            qdata[1] = weights * detJ   # mass contribution
+
+            # Upper triangle of JᵀJ (symmetric storage)
+            k = 2
             for i = 1:dim
                 for j = i:dim
-                    qdata[idx] = dx[:, i]' * dx[:, j]
-                    idx += 1
+                    s = zero(eltype(dx))
+                    @inbounds @simd for m = 1:dim
+                        s += dx[m,i] * dx[m,j]
+                    end
+                    qdata[k] = s
+                    k += 1
                 end
             end
-        end,
+        end
     )
 
-    #Create the operator that builds the quadrature data for the mass operator
     build_oper = Operator(
         ceed,
         qf=build_qfunc,
         fields=[
-            (:dx, mesh_rstr, mesh_basis, CeedVectorActive()),
+            (:dx,      mesh_rstr, mesh_basis, mesh_coords),
             (:weights, ElemRestrictionNone(), mesh_basis, CeedVectorNone()),
-            (:qdata, sol_rstr_i, BasisNone(), CeedVectorActive()),
+            (:qdata,   qdata_rstr, BasisNone(), qdata),
         ],
     )
 
-    # Apply to get qdata
-    elem_qpts = num_qpts^dim
-    num_elem = prod(nxyz)
-    qdata = CeedVector(ceed, num_elem * elem_qpts * num_q_comp)
-    print("Computing the quadrature data for the mass operator ...")
+    print("Computing quadrature data ... ")
     flush(stdout)
     apply!(build_oper, mesh_coords, qdata)
-    println(" done.")
+    println("done.")
 
-    #Create QFunction for applying the mass+diffusion operator
     @interior_qf apply_qfunc = (
         ceed,
         dim=dim,
-        (u, :in, EVAL_INTERP),
-        (du, :in, EVAL_GRAD, dim),
-        (qdata, :in, EVAL_NONE, num_q_comp),
-        (v, :out, EVAL_INTERP),
-        (dv, :out, EVAL_GRAD, dim),
+        (u,     :in,  EVAL_INTERP),
+        (du,    :in,  EVAL_GRAD, dim),
+        (qdata, :in,  EVAL_NONE, num_q_comp),
+        (v,     :out, EVAL_INTERP),
+        (dv,    :out, EVAL_GRAD, dim),
         begin
-            # Apply mass: v = qdata[1] * u
-            v .= qdata[1] .* u
-            
-            # Apply diffusion: dv = (qdata[2:end]) * du
-            # The qdata contains the symmetric diffusion tensor (J^T*J)
-            # dv_i = sum_j (J^T*J)_{i,j} * du_j
-            
-            # For efficiency, rebuild the matrix from stored components
+            v .= qdata[1] .* u                     # mass part
+
+            # diffusion part: read symmetric JᵀJ from its row-major packed upper triangle
             idx = 2
             for i = 1:dim
-                dv_i = 0.0
+                acc = zero(eltype(dv))
                 for j = 1:dim
-                    # Reconstruct symmetric matrix element
                     if j >= i
-                        mat_idx = idx + div((j-1)*j, 2) + (i-1)
+                        mat_idx = idx + (i-1)*dim - ((i-1)*(i-2))÷2 + (j-i)  # entry (i,j), in build_qfunc's write order
                     else
-                        mat_idx = idx + div((i-1)*i, 2) + (j-1)
+                        mat_idx = idx + (j-1)*dim - ((j-1)*(j-2))÷2 + (i-j)  # symmetric entry (j,i)
                     end
-                    dv_i += qdata[mat_idx] * du[j]
+                    acc += qdata[mat_idx] * du[j]
                 end
-                dv[i] = dv_i
+                dv[i] = acc
             end
-        end,
+        end
     )
+
     apply_oper = Operator(
-    ceed,
-    qf=apply_qfunc,
-    fields=[
-        (:u, sol_rstr, sol_basis, CeedVectorActive()),
-        (:du, sol_rstr, sol_basis, CeedVectorActive()),
-        (:qdata, sol_rstr_i, BasisNone(), qdata),
-        (:v, sol_rstr, sol_basis, CeedVectorActive()),
-        (:dv, sol_rstr, sol_basis, CeedVectorActive()),
-    ],
-)
+        ceed,
+        qf=apply_qfunc,
+        fields=[
+            (:u,     sol_rstr,  sol_basis,  CeedVectorActive()),
+            (:du,    sol_rstr,  sol_basis,  CeedVectorActive()),
+            (:qdata, qdata_rstr, BasisNone(), qdata),
+            (:v,     sol_rstr,  sol_basis,  CeedVectorActive()),
+            (:dv,    sol_rstr,  sol_basis,  CeedVectorActive()),
+        ],
+    )
 
-# # Compute the mesh volume using the massdiff operator
-    print("Computing the mesh volume using the formula: vol = 1^T * (M + K) * 1...")
-    flush(stdout)
-    
-    u = CeedVector(ceed, sol_size)
-    v = CeedVector(ceed, sol_size)
-    u[] = 1.0
-    
-    # Apply operator
-    apply!(apply_oper, u, v)
     
-    # Compute volume
-    vol = witharray_read(sum, v, MEM_HOST)
-    
-    @printf("Exact mesh volume    : % .14g\n", exact_vol)
-    @printf("Computed mesh volume : % .14g\n", vol)
-    @printf("Volume error         : % .14g\n", vol - exact_vol)
+    print("Computing volume via 1ᵀ (M + K) 1 ... ")
+    flush(stdout)
+    u_vec = CeedVector(ceed, sol_size)
+    v_vec = CeedVector(ceed, sol_size)
+
+    u_vec[] = 1.0
+    apply!(apply_oper, u_vec, v_vec)
+
+    computed_vol = witharray_read(sum, v_vec, MEM_HOST)
+    @printf("Exact mesh volume    : %.14g\n", exact_vol)
+    @printf("Computed mesh volume : %.14g\n", computed_vol)
+    @printf("Volume error         : %.14g\n", computed_vol - exact_vol)
 end
 
-# Entry point
+
+# Run
+
 run_ex3(
-    ceed_spec="/cpu/self",
-    dim=2,
-    mesh_order=2,
-    sol_order=2,
-    num_qpts=3,
-    prob_size=-1,
-    gallery=false,
+    ceed_spec  = "/cpu/self",   # use "/gpu/cuda" or "/gpu/hip" if available
+    dim        = 2,
+    mesh_order = 3,
+    sol_order  = 3,
+    num_qpts   = 4,
+    prob_size  = -1,            # -1 → auto-size (~256K dofs)
 )