5

Roushelfy · Roushelfy · commit fd53a05738f5 · 2024-06-26T20:18:49.000-04:00
diff --git a/simulators/4_friction/CMakeLists.txt b/simulators/4_friction/CMakeLists.txt
@@ -1,18 +1,18 @@
-add_executable(4_friction_debug)
+add_executable(4_friction)
 
-target_compile_options(4_friction_debug PRIVATE -g)
-set_target_properties(4_friction_debug PROPERTIES CUDA_SEPARABLE_COMPILATION ON)
+target_compile_options(4_friction PRIVATE -g)
+set_target_properties(4_friction PROPERTIES CUDA_SEPARABLE_COMPILATION ON)
 
-target_link_libraries(4_friction_debug PRIVATE muda cusolver cublas cusparse )
+target_link_libraries(4_friction PRIVATE muda cusolver cublas cusparse )
 
 option(BUILD_SHARED_LIBS "Build shared libraries" OFF)
 
 include_directories(include)
 
-file(GLOB_RECURSE 4_friction_debug_CU_SOURCE CONFIGURE_DEPENDS "src/*.cu")
-target_sources(4_friction_debug PRIVATE ${4_friction_debug_CU_SOURCE})
+file(GLOB_RECURSE 4_friction_CU_SOURCE CONFIGURE_DEPENDS "src/*.cu")
+target_sources(4_friction PRIVATE ${4_friction_CU_SOURCE})
 
-file(GLOB_RECURSE 4_friction_debug_CPP_SOURCE CONFIGURE_DEPENDS "src/*.cpp")
-target_sources(4_friction_debug PRIVATE ${4_friction_debug_CPP_SOURCE})
+file(GLOB_RECURSE 4_friction_CPP_SOURCE CONFIGURE_DEPENDS "src/*.cpp")
+target_sources(4_friction PRIVATE ${4_friction_CPP_SOURCE})
 
-target_link_libraries(4_friction_debug PRIVATE sfml-graphics)
+target_link_libraries(4_friction PRIVATE sfml-graphics)
diff --git a/simulators/4_friction/src/main.cpp b/simulators/4_friction/src/main.cpp
@@ -2,7 +2,7 @@
 
 int main()
 {
-	float rho = 1000, k = 4e4, initial_stretch = 1, n_seg = 8, h = 0.01, side_len = 1, tol = 0.01, mu = 0.11;
+	float rho = 1000, k = 4e4, initial_stretch = 1, n_seg = 14, h = 0.01, side_len = 1, tol = 0.01, mu = 0.11;
 	// printf("Running mass-spring simulator with parameters: rho = %f, k = %f, initial_stretch = %f, n_seg = %d, h = %f, side_len = %f, tol = %f\n", rho, k, initial_stretch, n_seg, h, side_len, tol);
 	FrictionSimulator<float, 2> simulator(rho, side_len, initial_stretch, k, h, tol, mu, n_seg);
 	simulator.run();
diff --git a/simulators/5_mov_dirichlet/include/SpringEnergy.h b/simulators/5_mov_dirichlet/include/SpringEnergy.h
@@ -18,6 +18,7 @@ class SpringEnergy
     SpringEnergy &operator=(SpringEnergy &&rhs);
 
     void update_x(const DeviceBuffer<T> &x);
+    void update_DBC_target();
     T val();                                 // Calculate the value of the energy
     const DeviceBuffer<T> &grad();           // Calculate the gradient of the energy
     const DeviceTripletMatrix<T, 1> &hess(); // Calculate the Hessian matrix of the energy
diff --git a/simulators/5_mov_dirichlet/include/simulator.h b/simulators/5_mov_dirichlet/include/simulator.h
@@ -5,14 +5,14 @@
 #include "square_mesh.h"
 #include <iostream>
 template <typename T, int dim>
-class FrictionSimulator
+class MovDirichletSimulator
 {
 public:
-    FrictionSimulator();
-    ~FrictionSimulator();
-    FrictionSimulator(FrictionSimulator &&rhs);
-    FrictionSimulator &operator=(FrictionSimulator &&rhs);
-    FrictionSimulator(T rho, T side_len, T initial_stretch, T K, T h, T tol, T mu, int n_seg);
+    MovDirichletSimulator();
+    ~MovDirichletSimulator();
+    MovDirichletSimulator(MovDirichletSimulator &&rhs);
+    MovDirichletSimulator &operator=(MovDirichletSimulator &&rhs);
+    MovDirichletSimulator(T rho, T side_len, T initial_stretch, T K, T h, T tol, T mu, int n_seg);
     void run();
 
 private:
diff --git a/simulators/5_mov_dirichlet/src/BarrierEnergy.cu b/simulators/5_mov_dirichlet/src/BarrierEnergy.cu
@@ -11,7 +11,7 @@ template <typename T, int dim>
 struct BarrierEnergy<T, dim>::Impl
 {
 	DeviceBuffer<T> device_x;
-	DeviceBuffer<T> device_contact_area, device_n, device_o;
+	DeviceBuffer<T> device_contact_area, device_n,device_n_ceil, device_o;
 	int N;
 	DeviceBuffer<T> device_grad;
 	DeviceTripletMatrix<T, 1> device_hess;
@@ -38,9 +38,12 @@ BarrierEnergy<T, dim>::BarrierEnergy(const std::vector<T> &x, const std::vector<
 	pimpl_->N = x.size() / dim;
 	pimpl_->device_x.copy_from(x);
 	pimpl_->device_contact_area.copy_from(contact_area);
+	std::vector<T> n_ceil(dim);
+	n_ceil[1]=-1;
+	pimpl_->device_n_ceil.copy_from(n_ceil);
 	pimpl_->device_n.copy_from(n);
 	pimpl_->device_o.copy_from(o);
-	pimpl_->device_hess.resize_triplets(pimpl_->N * dim * dim);
+	pimpl_->device_hess.resize_triplets((pimpl_->N *2-1)* dim * dim);
 	pimpl_->device_hess.reshape(x.size(), x.size());
 	pimpl_->device_grad.resize(pimpl_->N * dim);
 }
@@ -57,20 +60,32 @@ T BarrierEnergy<T, dim>::val()
 	auto &device_x = pimpl_->device_x;
 	auto &device_contact_area = pimpl_->device_contact_area;
 	auto &device_n = pimpl_->device_n;
+	auto &device_n_ceil = pimpl_->device_n_ceil;
 	auto &device_o = pimpl_->device_o;
 	int N = device_x.size() / dim;
-	DeviceBuffer<T> device_val(N);
-	ParallelFor(256).apply(N, [device_val = device_val.viewer(), device_x = device_x.cviewer(), device_contact_area = device_contact_area.cviewer(), device_n = device_n.cviewer(), device_o = device_o.cviewer()] __device__(int i) mutable
+	DeviceBuffer<T> device_val1(N);
+	DeviceBuffer<T> device_val2(N);
+	ParallelFor(256).apply(N, [device_val1 = device_val1.viewer(), device_x = device_x.cviewer(), device_contact_area = device_contact_area.cviewer(), device_n = device_n.cviewer(), device_o = device_o.cviewer()] __device__(int i) mutable
 						   { T d = 0;
 						   for(int j=0;j<dim;j++){
 							   d += device_n(j)*(device_x(i*dim+j)-device_o(j));
 						   }
 						   if(d<dhat){
 							   T s = d / dhat;
-							   device_val(i)= kappa * device_contact_area(i) * dhat/2*(s-1)*log(s);
+							   device_val1(i)= kappa * device_contact_area(i) * dhat/2*(s-1)*log(s);
 						   } })
 		.wait();
-	return devicesum(device_val);
+	ParallelFor(256).apply(N-1, [device_val2 = device_val2.viewer(), device_x = device_x.cviewer(), device_contact_area = device_contact_area.cviewer(), device_n_ceil = device_n_ceil.cviewer(), device_o = device_o.cviewer(),N] __device__(int i) mutable
+						   { T d = 0;
+						   for(int j=0;j<dim;j++){
+							   d += device_n_ceil(j)*(device_x(i*dim+j)-device_x((N-1)*dim+j));
+						   }
+						   if(d<dhat){
+							   T s = d / dhat;
+							   device_val2(i)= kappa * device_contact_area(i) * dhat/2*(s-1)*log(s);
+						   } })
+		.wait();
+	return devicesum(device_val1)+devicesum(device_val2);
 } // Calculate the energy
 
 template <typename T, int dim>
@@ -80,6 +95,7 @@ const DeviceBuffer<T> &BarrierEnergy<T, dim>::grad()
 	auto &device_contact_area = pimpl_->device_contact_area;
 	int N = device_x.size() / dim;
 	auto &device_n = pimpl_->device_n;
+	auto &device_n_ceil = pimpl_->device_n_ceil;
 	auto &device_o = pimpl_->device_o;
 	auto &device_grad = pimpl_->device_grad;
 	device_grad.fill(0);
@@ -99,6 +115,23 @@ const DeviceBuffer<T> &BarrierEnergy<T, dim>::grad()
 								   }
 							   } })
 		.wait();
+	ParallelFor(256).apply(N-1, [device_x = device_x.cviewer(), device_contact_area = device_contact_area.cviewer(), device_grad = device_grad.viewer(), device_n_ceil = device_n_ceil.cviewer(), device_o = device_o.cviewer(),N] __device__(int i) mutable
+
+						   {
+							   T d = 0;
+							   for(int j=0;j<dim;j++){
+								   d += device_n_ceil(j)*(device_x(i*dim+j)-device_x((N-1)*dim+j));
+							   }
+							   if (d < dhat)
+							   {
+								   T s = d / dhat;
+								   for (int j = 0; j < dim; j++)
+								   {
+									   T grad =device_contact_area(i) * dhat * (kappa / 2 * (log(s) / dhat + (s - 1) / d)) * device_n_ceil(j);
+									   device_grad(i * dim + j) += grad;
+									   device_grad((N-1) * dim + j) -= grad;
+								   }
+							   } }).wait();
 	return device_grad;
 }
 
@@ -108,6 +141,7 @@ const DeviceTripletMatrix<T, 1> &BarrierEnergy<T, dim>::hess()
 	auto &device_x = pimpl_->device_x;
 	auto &device_contact_area = pimpl_->device_contact_area;
 	auto &device_n = pimpl_->device_n;
+	auto &device_n_ceil = pimpl_->device_n_ceil;
 	auto &device_o = pimpl_->device_o;
 	auto &device_hess = pimpl_->device_hess;
 	auto device_hess_row_idx = device_hess.row_indices();
@@ -144,6 +178,35 @@ const DeviceTripletMatrix<T, 1> &BarrierEnergy<T, dim>::hess()
 				}
 			} })
 		.wait();
+	ParallelFor(256).apply(N-1, [device_x = device_x.cviewer(), device_contact_area = device_contact_area.cviewer(), device_hess_val = device_hess_val.viewer(), device_hess_row_idx = device_hess_row_idx.viewer(), device_hess_col_idx = device_hess_col_idx.viewer(), N, device_n_ceil = device_n_ceil.cviewer(), device_o = device_o.cviewer()] __device__(int i) mutable
+						   {
+		T d = 0;
+		for (int j = 0; j < dim; j++)
+		{
+			d += device_n_ceil(j) * (device_x(i * dim + j) - device_x((N-1) * dim + j));
+		}
+		if (d < dhat)
+			for (int j = 0; j < dim; j++)
+			{
+				for (int k = 0; k < dim; k++)
+				{
+					int idx =N*dim*dim+ i * dim * dim + j * dim + k;
+					device_hess_row_idx(idx) = (N-1) * dim + j;
+					device_hess_col_idx(idx) = (N-1) * dim + k;
+					device_hess_val(idx) = device_contact_area(i) * dhat * kappa / (2 * d * d * dhat) * (d + dhat) * device_n_ceil(j) * device_n_ceil(k);
+				}
+			}
+		else
+			for (int j = 0; j < dim; j++)
+			{
+				for (int k = 0; k < dim; k++)
+				{
+					int idx = N*dim*dim+i * dim * dim + j * dim + k;
+					device_hess_row_idx(idx) = (N-1) * dim + j;
+					device_hess_col_idx(idx) = (N-1) * dim + k;
+					device_hess_val(idx) = 0;
+				}
+			} }).wait();
 	return device_hess;
 
 } // Calculate the Hessian of the energy
@@ -153,6 +216,7 @@ T BarrierEnergy<T, dim>::init_step_size(const DeviceBuffer<T> &p)
 {
 	auto &device_x = pimpl_->device_x;
 	auto &device_n = pimpl_->device_n;
+	auto &device_n_ceil = pimpl_->device_n_ceil;
 	auto &device_o = pimpl_->device_o;
 	int N = device_x.size() / dim;
 	DeviceBuffer<T> device_alpha(N);
@@ -176,6 +240,26 @@ T BarrierEnergy<T, dim>::init_step_size(const DeviceBuffer<T> &p)
 			device_alpha(i) = min(device_alpha(i), 0.9 * alpha / -p_n);
 		} })
 		.wait();
+	
+	ParallelFor(256)
+		.apply(N-1, [device_x = device_x.cviewer(), p = p.cviewer(), device_alpha = device_alpha.viewer(), device_n_ceil = device_n_ceil.cviewer(), device_o = device_o.cviewer(),N] __device__(int i) mutable
+
+			   {
+		T p_n = 0;
+		for (int j = 0; j < dim; j++)
+		{
+			p_n += p(i * dim + j) * device_n_ceil(j);
+		}
+		if (p_n < 0)
+		{
+			T alpha = 0;
+			for (int j = 0; j < dim; j++)
+			{
+				alpha += device_n_ceil(j) * (device_x(i * dim + j) - device_x((N-1) * dim + j));
+			}
+			device_alpha(i) = min(device_alpha(i), 0.9 * alpha / -p_n);
+		} })
+		.wait();
 	return min_vector(device_alpha);
 }
 template class BarrierEnergy<float, 2>;
diff --git a/simulators/5_mov_dirichlet/src/SpringEnergy.cu b/simulators/5_mov_dirichlet/src/SpringEnergy.cu
@@ -15,7 +15,7 @@ struct SpringEnergy<T, dim>::Impl
     DeviceBuffer<Eigen::Matrix<T, dim, 1>> device_DBC_target;
     DeviceBuffer<T> device_grad;
     DeviceTripletMatrix<T, 1> device_hess;
-    T k;
+    T k,h;
     int N;
 };
 
@@ -36,7 +36,7 @@ SpringEnergy<T, dim>::SpringEnergy(const SpringEnergy<T, dim> &rhs)
     : pimpl_{std::make_unique<Impl>(*rhs.pimpl_)} {}
 
 template <typename T, int dim>
-SpringEnergy<T, dim>::SpringEnergy(const std::vector<T> &x, const std::vector<T> &m, const std::vector<int> &DBC, const std::vector<Eigen::Matrix<T, dim, 1>> &DBC_target, T k)
+SpringEnergy<T, dim>::SpringEnergy(const std::vector<T> &x, const std::vector<T> &m, const std::vector<int> &DBC, const std::vector<T> &DBC_target, T k,T h)
     : pimpl_{std::make_unique<Impl>()}
 {
     pimpl_->N = x.size() / dim;
@@ -45,6 +45,7 @@ SpringEnergy<T, dim>::SpringEnergy(const std::vector<T> &x, const std::vector<T>
     pimpl_->device_DBC.copy_from(DBC);
     pimpl_->device_DBC_target.copy_from(DBC_target);
     pimpl_->k = k;
+    pimpl_->h = h;
     pimpl_->device_grad.resize(pimpl_->N * dim);
     pimpl_->device_hess.resize_triplets(pimpl_->N * dim * dim);
     pimpl_->device_hess.reshape(x.size(), x.size());
@@ -56,6 +57,21 @@ void SpringEnergy<T, dim>::update_x(const DeviceBuffer<T> &x)
     pimpl_->device_x.view().copy_from(x);
 }
 
+template <typename T, int dim>
+void SpringEnergy<T, dim>::update_DBC_target()
+{
+        // TODO: stub -- binds the state below but does not yet read or modify device_DBC_target.
+        // Pseudocode kept from the original comment (presumably the reference to port; DBC_limit / DBC_v are not visible here):
+        //   for i in range(0, len(DBC)):
+        //       if (DBC_limit[i] - x_n[DBC[i]]).dot(DBC_v[i]) > 0: DBC_target.append(x_n[DBC[i]] + h * DBC_v[i])
+        //       else:                                              DBC_target.append(x_n[DBC[i]])
+        auto &device_x = pimpl_->device_x;
+        auto &device_DBC = pimpl_->device_DBC;
+        auto &device_DBC_target = pimpl_->device_DBC_target;
+        auto h = pimpl_->h;
+
+}
+
 template <typename T, int dim>
 T SpringEnergy<T, dim>::val()
 {
@@ -75,7 +91,7 @@ T SpringEnergy<T, dim>::val()
             Eigen::Matrix<T, dim, 1> diff;
             for (int j = 0; j < dim; ++j)
             {
-                diff(j) = device_x(idx * dim + j) - device_DBC_target(i)(j);
+                diff(j) = device_x(idx * dim + j) - device_DBC_target(i*dim + j);
             }
             device_val(i) = 0.5 * k * device_m(idx) * diff.dot(diff); })
         .wait();
@@ -102,7 +118,7 @@ const DeviceBuffer<T> &SpringEnergy<T, dim>::grad()
             Eigen::Matrix<T, dim, 1> grad;
             for (int j = 0; j < dim; ++j)
             {
-                grad(j) = device_x(idx * dim + j) - device_DBC_target(i)(j);
+                grad(j) = device_x(idx * dim + j) - device_DBC_target(i*dim + j);
             }
             grad *= k * device_m(idx);
             for (int j = 0; j < dim; ++j)
diff --git a/simulators/5_mov_dirichlet/src/simulator.cu b/simulators/5_mov_dirichlet/src/simulator.cu

Original file line number	Diff line number	Diff line change
`@@ -2,7 +2,7 @@`
`2`	`2`
`3`	`3`	`int main()`
`4`	`4`	`{`
`5`		`- float rho = 1000, k = 4e4, initial_stretch = 1, n_seg = 8, h = 0.01, side_len = 1, tol = 0.01, mu = 0.11;`
	`5`	`+ float rho = 1000, k = 4e4, initial_stretch = 1, n_seg = 14, h = 0.01, side_len = 1, tol = 0.01, mu = 0.11;`
`6`	`6`	`// printf("Running mass-spring simulator with parameters: rho = %f, k = %f, initial_stretch = %f, n_seg = %d, h = %f, side_len = %f, tol = %f\n", rho, k, initial_stretch, n_seg, h, side_len, tol);`
`7`	`7`	`FrictionSimulator<float, 2> simulator(rho, side_len, initial_stretch, k, h, tol, mu, n_seg);`
`8`	`8`	`simulator.run();`