#include "optimizer.hpp" #include #include #include #include #include #include #include #include "config.hpp" #include "field-math.hpp" #include "flow.hpp" #include "parametrizer.hpp" namespace qflow { #ifdef WITH_CUDA # include #endif #ifndef EIGEN_MPL2_ONLY template using LinearSolver = Eigen::SimplicialLLT; #else template using LinearSolver = Eigen::SparseLU; #endif Optimizer::Optimizer() {} void Optimizer::optimize_orientations(Hierarchy& mRes) { #ifdef WITH_CUDA optimize_orientations_cuda(mRes); printf("%s\n", cudaGetErrorString(cudaDeviceSynchronize())); cudaMemcpy(mRes.mQ[0].data(), mRes.cudaQ[0], sizeof(glm::dvec3) * mRes.mQ[0].cols(), cudaMemcpyDeviceToHost); #else int levelIterations = 6; for (int level = mRes.mN.size() - 1; level >= 0; --level) { AdjacentMatrix& adj = mRes.mAdj[level]; const MatrixXd& N = mRes.mN[level]; const MatrixXd& CQ = mRes.mCQ[level]; const VectorXd& CQw = mRes.mCQw[level]; MatrixXd& Q = mRes.mQ[level]; auto& phases = mRes.mPhases[level]; for (int iter = 0; iter < levelIterations; ++iter) { for (int phase = 0; phase < phases.size(); ++phase) { auto& p = phases[phase]; #ifdef WITH_OMP #pragma omp parallel for #endif for (int pi = 0; pi < p.size(); ++pi) { int i = p[pi]; const Vector3d n_i = N.col(i); double weight_sum = 0.0f; Vector3d sum = Q.col(i); for (auto& link : adj[i]) { const int j = link.id; const double weight = link.weight; if (weight == 0) continue; const Vector3d n_j = N.col(j); Vector3d q_j = Q.col(j); std::pair value = compat_orientation_extrinsic_4(sum, n_i, q_j, n_j); sum = value.first * weight_sum + value.second * weight; sum -= n_i * n_i.dot(sum); weight_sum += weight; double norm = sum.norm(); if (norm > RCPOVERFLOW) sum /= norm; } if (CQw.size() > 0) { float cw = CQw[i]; if (cw != 0) { std::pair value = compat_orientation_extrinsic_4(sum, n_i, CQ.col(i), n_i); sum = value.first * (1 - cw) + value.second * cw; sum -= n_i * n_i.dot(sum); float norm = sum.norm(); if (norm > RCPOVERFLOW) sum /= norm; } } if (weight_sum > 0) { Q.col(i) = sum; } } } } if (level > 0) { const MatrixXd& srcField = mRes.mQ[level]; const MatrixXi& toUpper = mRes.mToUpper[level - 1]; MatrixXd& destField = mRes.mQ[level - 1]; const MatrixXd& N = mRes.mN[level - 1]; #ifdef WITH_OMP #pragma omp parallel for #endif for (int i = 0; i < srcField.cols(); ++i) { for (int k = 0; k < 2; ++k) { int dest = toUpper(k, i); if (dest == -1) continue; Vector3d q = srcField.col(i), n = N.col(dest); destField.col(dest) = q - n * n.dot(q); } } } } for (int l = 0; l < mRes.mN.size() - 1; ++l) { const MatrixXd& N = mRes.mN[l]; const MatrixXd& N_next = mRes.mN[l + 1]; const MatrixXd& Q = mRes.mQ[l]; MatrixXd& Q_next = mRes.mQ[l + 1]; auto& toUpper = mRes.mToUpper[l]; #ifdef WITH_OMP #pragma omp parallel for #endif for (int i = 0; i < toUpper.cols(); ++i) { Vector2i upper = toUpper.col(i); Vector3d q0 = Q.col(upper[0]); Vector3d n0 = N.col(upper[0]); Vector3d q; if (upper[1] != -1) { Vector3d q1 = Q.col(upper[1]); Vector3d n1 = N.col(upper[1]); auto result = compat_orientation_extrinsic_4(q0, n0, q1, n1); q = result.first + result.second; } else { q = q0; } Vector3d n = N_next.col(i); q -= n.dot(q) * n; if (q.squaredNorm() > RCPOVERFLOW) q.normalize(); Q_next.col(i) = q; } } #endif } void Optimizer::optimize_scale(Hierarchy& mRes, VectorXd& rho, int adaptive) { const MatrixXd& N = mRes.mN[0]; MatrixXd& Q = mRes.mQ[0]; MatrixXd& V = mRes.mV[0]; MatrixXd& S = mRes.mS[0]; MatrixXd& K = mRes.mK[0]; MatrixXi& F = mRes.mF; if (adaptive) { std::vector> lhsTriplets; lhsTriplets.reserve(F.cols() * 6); for (int i = 0; i < V.cols(); ++i) { for (int j = 0; j < 2; ++j) { S(j, i) = 1.0; double sc1 = std::max(0.75 * S(j, i), rho[i] * 1.0 / mRes.mScale); S(j, i) = std::min(S(j, i), sc1); } } std::vector> entries(V.cols() * 2); double lambda = 1; for (int i = 0; i < entries.size(); ++i) { entries[i][i] = lambda; } for (int i = 0; i < F.cols(); ++i) { for (int j = 0; j < 3; ++j) { int v1 = F(j, i); int v2 = F((j + 1) % 3, i); Vector3d diff = V.col(v2) - V.col(v1); Vector3d q_1 = Q.col(v1); Vector3d q_2 = Q.col(v2); Vector3d n_1 = N.col(v1); Vector3d n_2 = N.col(v2); Vector3d q_1_y = n_1.cross(q_1); auto index = compat_orientation_extrinsic_index_4(q_1, n_1, q_2, n_2); int v1_x = v1 * 2, v1_y = v1 * 2 + 1, v2_x = v2 * 2, v2_y = v2 * 2 + 1; double dx = diff.dot(q_1); double dy = diff.dot(q_1_y); double kx_g = K(0, v1); double ky_g = K(1, v1); if (index.first % 2 != index.second % 2) { std::swap(v2_x, v2_y); } double scale_x = (fmin(fmax(1 + kx_g * dy, 0.3), 3)); double scale_y = (fmin(fmax(1 + ky_g * dx, 0.3), 3)); // (v2_x - scale_x * v1_x)^2 = 0 // x^2 - 2s xy + s^2 y^2 entries[v2_x][v2_x] += 1; entries[v1_x][v1_x] += scale_x * scale_x; entries[v2_y][v2_y] += 1; entries[v1_y][v1_y] += scale_y * scale_y; auto it = entries[v1_x].find(v2_x); if (it == entries[v1_x].end()) { entries[v1_x][v2_x] = -scale_x; entries[v2_x][v1_x] = -scale_x; entries[v1_y][v2_y] = -scale_y; entries[v2_y][v1_y] = -scale_y; } else { it->second -= scale_x; entries[v2_x][v1_x] -= scale_x; entries[v1_y][v2_y] -= scale_y; entries[v2_y][v1_y] -= scale_y; } } } Eigen::SparseMatrix A(V.cols() * 2, V.cols() * 2); VectorXd rhs(V.cols() * 2); rhs.setZero(); for (int i = 0; i < entries.size(); ++i) { rhs(i) = lambda * S(i % 2, i / 2); for (auto& rec : entries[i]) { lhsTriplets.push_back(Eigen::Triplet(i, rec.first, rec.second)); } } A.setFromTriplets(lhsTriplets.begin(), lhsTriplets.end()); LinearSolver> solver; solver.analyzePattern(A); solver.factorize(A); VectorXd result = solver.solve(rhs); double total_area = 0; for (int i = 0; i < V.cols(); ++i) { S(0, i) = (result(i * 2)); S(1, i) = (result(i * 2 + 1)); total_area += S(0, i) * S(1, i); } total_area = sqrt(V.cols() / total_area); for (int i = 0; i < V.cols(); ++i) { // S(0, i) *= total_area; // S(1, i) *= total_area; } } else { for (int i = 0; i < V.cols(); ++i) { S(0, i) = 1; S(1, i) = 1; } } for (int l = 0; l < mRes.mS.size() - 1; ++l) { const MatrixXd& S = mRes.mS[l]; MatrixXd& S_next = mRes.mS[l + 1]; auto& toUpper = mRes.mToUpper[l]; for (int i = 0; i < toUpper.cols(); ++i) { Vector2i upper = toUpper.col(i); Vector2d q0 = S.col(upper[0]); if (upper[1] != -1) { q0 = (q0 + S.col(upper[1])) * 0.5; } S_next.col(i) = q0; } } } void Optimizer::optimize_positions(Hierarchy& mRes, int with_scale) { int levelIterations = 6; #ifdef WITH_CUDA optimize_positions_cuda(mRes); cudaMemcpy(mRes.mO[0].data(), mRes.cudaO[0], sizeof(glm::dvec3) * mRes.mO[0].cols(), cudaMemcpyDeviceToHost); #else for (int level = mRes.mAdj.size() - 1; level >= 0; --level) { for (int iter = 0; iter < levelIterations; ++iter) { AdjacentMatrix& adj = mRes.mAdj[level]; const MatrixXd &N = mRes.mN[level], &Q = mRes.mQ[level], &V = mRes.mV[level]; const MatrixXd& CQ = mRes.mCQ[level]; const MatrixXd& CO = mRes.mCO[level]; const VectorXd& COw = mRes.mCOw[level]; MatrixXd& O = mRes.mO[level]; MatrixXd& S = mRes.mS[level]; auto& phases = mRes.mPhases[level]; for (int phase = 0; phase < phases.size(); ++phase) { auto& p = phases[phase]; #ifdef WITH_OMP #pragma omp parallel for #endif for (int pi = 0; pi < p.size(); ++pi) { int i = p[pi]; double scale_x = mRes.mScale; double scale_y = mRes.mScale; if (with_scale) { scale_x *= S(0, i); scale_y *= S(1, i); } double inv_scale_x = 1.0f / scale_x; double inv_scale_y = 1.0f / scale_y; const Vector3d n_i = N.col(i), v_i = V.col(i); Vector3d q_i = Q.col(i); Vector3d sum = O.col(i); double weight_sum = 0.0f; q_i.normalize(); for (auto& link : adj[i]) { const int j = link.id; const double weight = link.weight; if (weight == 0) continue; double scale_x_1 = mRes.mScale; double scale_y_1 = mRes.mScale; if (with_scale) { scale_x_1 *= S(0, j); scale_y_1 *= S(1, j); } double inv_scale_x_1 = 1.0f / scale_x_1; double inv_scale_y_1 = 1.0f / scale_y_1; const Vector3d n_j = N.col(j), v_j = V.col(j); Vector3d q_j = Q.col(j), o_j = O.col(j); q_j.normalize(); std::pair value = compat_position_extrinsic_4( v_i, n_i, q_i, sum, v_j, n_j, q_j, o_j, scale_x, scale_y, inv_scale_x, inv_scale_y, scale_x_1, scale_y_1, inv_scale_x_1, inv_scale_y_1); sum = value.first * weight_sum + value.second * weight; weight_sum += weight; if (weight_sum > RCPOVERFLOW) sum /= weight_sum; sum -= n_i.dot(sum - v_i) * n_i; } if (COw.size() > 0) { float cw = COw[i]; if (cw != 0) { Vector3d co = CO.col(i), cq = CQ.col(i); Vector3d d = co - sum; d -= cq.dot(d) * cq; sum += cw * d; sum -= n_i.dot(sum - v_i) * n_i; } } if (weight_sum > 0) { O.col(i) = position_round_4(sum, q_i, n_i, v_i, scale_x, scale_y, inv_scale_x, inv_scale_y); } } } } if (level > 0) { const MatrixXd& srcField = mRes.mO[level]; const MatrixXi& toUpper = mRes.mToUpper[level - 1]; MatrixXd& destField = mRes.mO[level - 1]; const MatrixXd& N = mRes.mN[level - 1]; const MatrixXd& V = mRes.mV[level - 1]; #ifdef WITH_OMP #pragma omp parallel for #endif for (int i = 0; i < srcField.cols(); ++i) { for (int k = 0; k < 2; ++k) { int dest = toUpper(k, i); if (dest == -1) continue; Vector3d o = srcField.col(i), n = N.col(dest), v = V.col(dest); o -= n * n.dot(o - v); destField.col(dest) = o; } } } } #endif } void Optimizer::optimize_positions_dynamic( MatrixXi& F, MatrixXd& V, MatrixXd& N, MatrixXd& Q, std::vector>& Vset, std::vector& O_compact, std::vector& F_compact, std::vector& V2E_compact, std::vector& E2E_compact, double mScale, std::vector& diffs, std::vector& diff_count, std::map, int>& o2e, std::vector& sharp_o, std::map>& compact_sharp_constraints, int with_scale) { std::set uncertain; for (auto& info : o2e) { if (diff_count[info.second] == 0) { uncertain.insert(info.first.first); uncertain.insert(info.first.second); } } std::vector Vind(O_compact.size(), -1); std::vector> links(O_compact.size()); std::vector> dedges(O_compact.size()); std::vector> adj(V.cols()); for (int i = 0; i < F.cols(); ++i) { for (int j = 0; j < 3; ++j) { int v1 = F(j, i); int v2 = F((j + 1) % 3, i); adj[v1].push_back(v2); } } auto FindNearest = [&]() { for (int i = 0; i < O_compact.size(); ++i) { if (Vind[i] == -1) { double min_dis = 1e30; int min_ind = -1; for (auto v : Vset[i]) { double dis = (V.col(v) - O_compact[i]).squaredNorm(); if (dis < min_dis) { min_dis = dis; min_ind = v; } } if (min_ind > -1) { Vind[i] = min_ind; double x = (O_compact[i] - V.col(min_ind)).dot(N.col(min_ind)); O_compact[i] -= x * N.col(min_ind); } } else { int current_v = Vind[i]; Vector3d n = N.col(current_v); double current_dis = (O_compact[i] - V.col(current_v)).squaredNorm(); while (true) { int next_v = -1; for (auto& v : adj[current_v]) { if (N.col(v).dot(n) < cos(10.0 / 180.0 * 3.141592654)) continue; double dis = (O_compact[i] - V.col(v)).squaredNorm(); if (dis < current_dis) { current_dis = dis; next_v = v; } } if (next_v == -1) break; // rotate ideal distance Vector3d n1 = N.col(current_v); Vector3d n2 = N.col(next_v); Vector3d axis = n1.cross(n2); double len = axis.norm(); double angle = atan2(len, n1.dot(n2)); axis.normalized(); Matrix3d m = AngleAxisd(angle, axis).toRotationMatrix(); for (auto e : dedges[i]) { Vector3d& d = diffs[e]; d = m * d; } current_v = next_v; } Vind[i] = current_v; } } }; auto BuildConnection = [&]() { for (int i = 0; i < links.size(); ++i) { int deid0 = V2E_compact[i]; if (deid0 != -1) { std::list& connection = links[i]; std::list& dedge = dedges[i]; int deid = deid0; do { connection.push_back(F_compact[deid / 4][(deid + 1) % 4]); dedge.push_back(deid); deid = E2E_compact[deid / 4 * 4 + (deid + 3) % 4]; } while (deid != -1 && deid != deid0); if (deid == -1) { deid = deid0; do { deid = E2E_compact[deid]; if (deid == -1) break; deid = deid / 4 * 4 + (deid + 1) % 4; connection.push_front(F_compact[deid / 4][(deid + 1) % 4]); dedge.push_front(deid); } while (true); } } } }; std::vector lines; auto ComputeDistance = [&]() { std::set unobserved; for (auto& info : o2e) { if (diff_count[info.second] == 0) { unobserved.insert(info.first.first); } } while (true) { bool update = false; std::set observed; for (auto& p : unobserved) { std::vector observations, edges; int count = 0; for (auto& e : dedges[p]) { edges.push_back(e); if (diff_count[e]) { count += 1; observations.push_back(1); } else { observations.push_back(0); } } if (count <= 1) continue; update = true; observed.insert(p); for (int i = 0; i < observations.size(); ++i) { if (observations[i] == 1) continue; int j = i; std::list interp; while (observations[j] == 0) { interp.push_front(j); j -= 1; if (j < 0) j = edges.size() - 1; } j = (i + 1) % edges.size(); while (observations[j] == 0) { interp.push_back(j); j += 1; if (j == edges.size()) j = 0; } Vector3d dl = diffs[edges[(interp.front() + edges.size() - 1) % edges.size()]]; double lenl = dl.norm(); Vector3d dr = diffs[edges[(interp.back() + 1) % edges.size()]]; double lenr = dr.norm(); dl /= lenl; dr /= lenr; Vector3d n = dl.cross(dr).normalized(); double angle = atan2(dl.cross(dr).norm(), dl.dot(dr)); if (angle < 0) angle += 2 * 3.141592654; Vector3d nc = N.col(Vind[p]); if (n.dot(nc) < 0) { n = -n; angle = 2 * 3.141592654 - angle; } double step = (lenr - lenl) / (interp.size() + 1); angle /= interp.size() + 1; Vector3d dlp = nc.cross(dl).normalized(); int t = 0; for (auto q : interp) { t += 1; observations[q] = 1; double ad = angle * t; int e = edges[q]; int re = E2E_compact[e]; diff_count[e] = 2; diffs[e] = (cos(ad) * dl + sin(ad) * dlp) * (lenl + step * t); if (re != -1) { diff_count[re] = 2; diffs[re] = -diffs[e]; } } for (int i = 0; i < edges.size(); ++i) { lines.push_back(O_compact[p]); lines.push_back(O_compact[p] + diffs[edges[i]]); } } } if (!update) break; for (auto& p : observed) unobserved.erase(p); } }; BuildConnection(); int max_iter = 10; for (int iter = 0; iter < max_iter; ++iter) { FindNearest(); ComputeDistance(); std::vector> entries(O_compact.size() * 2); std::vector fixed_dim(O_compact.size() * 2, 0); for (auto& info : compact_sharp_constraints) { fixed_dim[info.first * 2 + 1] = 1; if (info.second.second.norm() < 0.5) fixed_dim[info.first * 2] = 1; } std::vector b(O_compact.size() * 2); std::vector x(O_compact.size() * 2); std::vector Q_compact(O_compact.size()); std::vector N_compact(O_compact.size()); std::vector V_compact(O_compact.size()); #ifdef WITH_OMP #pragma omp parallel for #endif for (int i = 0; i < O_compact.size(); ++i) { Q_compact[i] = Q.col(Vind[i]); N_compact[i] = N.col(Vind[i]); V_compact[i] = V.col(Vind[i]); if (fixed_dim[i * 2 + 1] && !fixed_dim[i * 2]) { Q_compact[i] = compact_sharp_constraints[i].second; V_compact[i] = compact_sharp_constraints[i].first; } } for (int i = 0; i < O_compact.size(); ++i) { Vector3d q = Q_compact[i]; Vector3d n = N_compact[i]; Vector3d q_y = n.cross(q); auto Vi = V_compact[i]; x[i * 2] = (O_compact[i] - Vi).dot(q); x[i * 2 + 1] = (O_compact[i] - Vi).dot(q_y); } for (int i = 0; i < O_compact.size(); ++i) { Vector3d qx = Q_compact[i]; Vector3d qy = N_compact[i]; qy = qy.cross(qx); auto dedge_it = dedges[i].begin(); for (auto it = links[i].begin(); it != links[i].end(); ++it, ++dedge_it) { int j = *it; Vector3d qx2 = Q_compact[j]; Vector3d qy2 = N_compact[j]; qy2 = qy2.cross(qx2); int de = o2e[std::make_pair(i, j)]; double lambda = (diff_count[de] == 1) ? 1 : 1; Vector3d target_offset = diffs[de]; auto Vi = V_compact[i]; auto Vj = V_compact[j]; Vector3d offset = Vj - Vi; // target_offset.normalize(); // target_offset *= mScale; Vector3d C = target_offset - offset; int vid[] = {j * 2, j * 2 + 1, i * 2, i * 2 + 1}; Vector3d weights[] = {qx2, qy2, -qx, -qy}; for (int ii = 0; ii < 4; ++ii) { for (int jj = 0; jj < 4; ++jj) { auto it = entries[vid[ii]].find(vid[jj]); if (it == entries[vid[ii]].end()) { entries[vid[ii]][vid[jj]] = lambda * weights[ii].dot(weights[jj]); } else { entries[vid[ii]][vid[jj]] += lambda * weights[ii].dot(weights[jj]); } } b[vid[ii]] += lambda * weights[ii].dot(C); } } } // fix sharp edges for (int i = 0; i < entries.size(); ++i) { if (entries[i].size() == 0) { entries[i][i] = 1; b[i] = x[i]; } if (fixed_dim[i]) { b[i] = x[i]; entries[i].clear(); entries[i][i] = 1; } else { std::unordered_map newmap; for (auto& rec : entries[i]) { if (fixed_dim[rec.first]) { b[i] -= rec.second * x[rec.first]; } else { newmap[rec.first] = rec.second; } } std::swap(entries[i], newmap); } } std::vector> lhsTriplets; lhsTriplets.reserve(F_compact.size() * 8); Eigen::SparseMatrix A(O_compact.size() * 2, O_compact.size() * 2); VectorXd rhs(O_compact.size() * 2); rhs.setZero(); for (int i = 0; i < entries.size(); ++i) { rhs(i) = b[i]; for (auto& rec : entries[i]) { lhsTriplets.push_back(Eigen::Triplet(i, rec.first, rec.second)); } } A.setFromTriplets(lhsTriplets.begin(), lhsTriplets.end()); #ifdef LOG_OUTPUT int t1 = GetCurrentTime64(); #endif // FIXME: IncompleteCholesky Preconditioner will fail here so I fallback to Diagonal one. // I suspected either there is a implementation bug in IncompleteCholesky Preconditioner // or there is a memory corruption somewhere. However, g++'s address sanitizer does not // report anything useful. LinearSolver> solver; solver.analyzePattern(A); solver.factorize(A); // Eigen::setNbThreads(1); // ConjugateGradient, Lower | Upper> solver; // VectorXd x0 = VectorXd::Map(x.data(), x.size()); // solver.setMaxIterations(40); // solver.compute(A); VectorXd x_new = solver.solve(rhs); // solver.solveWithGuess(rhs, x0); #ifdef LOG_OUTPUT // std::cout << "[LSQ] n_iteration:" << solver.iterations() << std::endl; // std::cout << "[LSQ] estimated error:" << solver.error() << std::endl; int t2 = GetCurrentTime64(); printf("[LSQ] Linear solver uses %lf seconds.\n", (t2 - t1) * 1e-3); #endif for (int i = 0; i < O_compact.size(); ++i) { // Vector3d q = Q.col(Vind[i]); Vector3d q = Q_compact[i]; // Vector3d n = N.col(Vind[i]); Vector3d n = N_compact[i]; Vector3d q_y = n.cross(q); auto Vi = V_compact[i]; O_compact[i] = Vi + q * x_new[i * 2] + q_y * x_new[i * 2 + 1]; } // forgive my hack... if (iter + 1 == max_iter) { for (int iter = 0; iter < 5; ++iter) { for (int i = 0; i < O_compact.size(); ++i) { if (sharp_o[i]) continue; if (dedges[i].size() != 4 || uncertain.count(i)) { Vector3d n(0, 0, 0), v(0, 0, 0); Vector3d v0 = O_compact[i]; for (auto e : dedges[i]) { Vector3d v1 = O_compact[F_compact[e / 4][(e + 1) % 4]]; Vector3d v2 = O_compact[F_compact[e / 4][(e + 3) % 4]]; n += (v1 - v0).cross(v2 - v0); v += v1; } n.normalize(); Vector3d offset = v / dedges[i].size() - v0; offset -= offset.dot(n) * n; O_compact[i] += offset; } } } } } } void Optimizer::optimize_positions_sharp( Hierarchy& mRes, std::vector& edge_values, std::vector& edge_diff, std::vector& sharp_edges, std::set& sharp_vertices, std::map>& sharp_constraints, int with_scale) { auto& V = mRes.mV[0]; auto& F = mRes.mF; auto& Q = mRes.mQ[0]; auto& N = mRes.mN[0]; auto& O = mRes.mO[0]; auto& S = mRes.mS[0]; DisajointTree tree(V.cols()); for (int i = 0; i < edge_diff.size(); ++i) { if (edge_diff[i].array().abs().sum() == 0) { tree.Merge(edge_values[i].x, edge_values[i].y); } } tree.BuildCompactParent(); std::map compact_sharp_indices; std::set compact_sharp_edges; for (int i = 0; i < sharp_edges.size(); ++i) { if (sharp_edges[i] == 1) { int v1 = tree.Index(F(i % 3, i / 3)); int v2 = tree.Index(F((i + 1) % 3, i / 3)); compact_sharp_edges.insert(DEdge(v1, v2)); } } for (auto& v : sharp_vertices) { int p = tree.Index(v); if (compact_sharp_indices.count(p) == 0) { int s = compact_sharp_indices.size(); compact_sharp_indices[p] = s; } } std::map> sharp_vertices_links; std::set sharp_dedges; for (int i = 0; i < sharp_edges.size(); ++i) { if (sharp_edges[i]) { int v1 = F(i % 3, i / 3); int v2 = F((i + 1) % 3, i / 3); if (sharp_vertices_links.count(v1) == 0) sharp_vertices_links[v1] = std::set(); sharp_vertices_links[v1].insert(v2); sharp_dedges.insert(DEdge(v1, v2)); } } std::vector> sharp_to_original_indices(compact_sharp_indices.size()); for (auto& v : sharp_vertices_links) { if (v.second.size() == 2) continue; int p = tree.Index(v.first); sharp_to_original_indices[compact_sharp_indices[p]].push_back(v.first); } for (auto& v : sharp_vertices_links) { if (v.second.size() != 2) continue; int p = tree.Index(v.first); sharp_to_original_indices[compact_sharp_indices[p]].push_back(v.first); } for (int i = 0; i < V.cols(); ++i) { if (sharp_vertices.count(i)) continue; int p = tree.Index(i); if (compact_sharp_indices.count(p)) sharp_to_original_indices[compact_sharp_indices[p]].push_back(i); } int num = sharp_to_original_indices.size(); std::vector> links(sharp_to_original_indices.size()); for (int e = 0; e < edge_diff.size(); ++e) { int v1 = edge_values[e].x; int v2 = edge_values[e].y; int p1 = tree.Index(v1); int p2 = tree.Index(v2); if (p1 == p2 || compact_sharp_edges.count(DEdge(p1, p2)) == 0) continue; p1 = compact_sharp_indices[p1]; p2 = compact_sharp_indices[p2]; links[p1].insert(p2); links[p2].insert(p1); } std::vector hash(links.size(), 0); std::vector> loops; for (int i = 0; i < num; ++i) { if (hash[i] == 1) continue; if (links[i].size() == 2) { std::vector q; q.push_back(i); hash[i] = 1; int v = i; int prev_v = -1; bool is_loop = false; while (links[v].size() == 2) { int next_v = -1; for (auto nv : links[v]) if (nv != prev_v) next_v = nv; if (hash[next_v]) { is_loop = true; break; } if (links[next_v].size() == 2) hash[next_v] = true; q.push_back(next_v); prev_v = v; v = next_v; } if (!is_loop && q.size() >= 2) { std::vector q1; int v = i; int prev_v = q[1]; while (links[v].size() == 2) { int next_v = -1; for (auto nv : links[v]) if (nv != prev_v) next_v = nv; if (hash[next_v]) { is_loop = true; break; } if (links[next_v].size() == 2) hash[next_v] = true; q1.push_back(next_v); prev_v = v; v = next_v; } std::reverse(q1.begin(), q1.end()); q1.insert(q1.end(), q.begin(), q.end()); std::swap(q1, q); } if (q.size() < 3) continue; if (is_loop) q.push_back(q.front()); double len = 0, scale = 0; std::vector o(q.size()), new_o(q.size()); std::vector sc(q.size()); for (int i = 0; i < q.size() - 1; ++i) { int v1 = q[i]; int v2 = q[i + 1]; auto it = links[v1].find(v2); if (it == links[v1].end()) { printf("Non exist!\n"); exit(0); } } for (int i = 0; i < q.size(); ++i) { if (sharp_to_original_indices[q[i]].size() == 0) { continue; } o[i] = O.col(sharp_to_original_indices[q[i]][0]); Vector3d qx = Q.col(sharp_to_original_indices[q[i]][0]); Vector3d qy = Vector3d(N.col(sharp_to_original_indices[q[i]][0])).cross(qx); int fst = sharp_to_original_indices[q[1]][0]; Vector3d dis = (i == 0) ? (Vector3d(O.col(fst)) - o[i]) : o[i] - o[i - 1]; if (with_scale) sc[i] = (abs(qx.dot(dis)) > abs(qy.dot(dis))) ? S(0, sharp_to_original_indices[q[i]][0]) : S(1, sharp_to_original_indices[q[i]][0]); else sc[i] = 1; new_o[i] = o[i]; } if (is_loop) { for (int i = 0; i < q.size(); ++i) { Vector3d dir = (o[(i + 1) % q.size()] - o[(i + q.size() - 1) % q.size()]).normalized(); for (auto& ind : sharp_to_original_indices[q[i]]) { sharp_constraints[ind] = std::make_pair(o[i], dir); } } } else { for (int i = 0; i < q.size(); ++i) { Vector3d dir(0, 0, 0); if (i != 0 && i + 1 != q.size()) dir = (o[i + 1] - o[i - 1]).normalized(); else if (links[q[i]].size() == 1) { if (i == 0) dir = (o[i + 1] - o[i]).normalized(); else dir = (o[i] - o[i - 1]).normalized(); } for (auto& ind : sharp_to_original_indices[q[i]]) { sharp_constraints[ind] = std::make_pair(o[i], dir); } } } for (int i = 0; i < q.size() - 1; ++i) { len += (o[i + 1] - o[i]).norm(); scale += sc[i]; } int next_m = q.size() - 1; double left_norm = len * sc[0] / scale; int current_v = 0; double current_norm = (o[1] - o[0]).norm(); for (int i = 1; i < next_m; ++i) { while (left_norm >= current_norm) { left_norm -= current_norm; current_v += 1; current_norm = (o[current_v + 1] - o[current_v]).norm(); } new_o[i] = (o[current_v + 1] * left_norm + o[current_v] * (current_norm - left_norm)) / current_norm; o[current_v] = new_o[i]; current_norm -= left_norm; left_norm = len * sc[current_v] / scale; } for (int i = 0; i < q.size(); ++i) { for (auto v : sharp_to_original_indices[q[i]]) { O.col(v) = new_o[i]; } } loops.push_back(new_o); } } return; std::ofstream os("/Users/jingwei/Desktop/sharp.obj"); for (int i = 0; i < loops.size(); ++i) { for (auto& v : loops[i]) { os << "v " << v[0] << " " << v[1] << " " << v[2] << "\n"; } } int offset = 1; for (int i = 0; i < loops.size(); ++i) { for (int j = 0; j < loops[i].size() - 1; ++j) { os << "l " << offset + j << " " << offset + j + 1 << "\n"; } offset += loops[i].size(); } os.close(); exit(0); } void Optimizer::optimize_positions_fixed( Hierarchy& mRes, std::vector& edge_values, std::vector& edge_diff, std::set& sharp_vertices, std::map>& sharp_constraints, int with_scale) { auto& V = mRes.mV[0]; auto& F = mRes.mF; auto& Q = mRes.mQ[0]; auto& N = mRes.mN[0]; auto& O = mRes.mO[0]; auto& S = mRes.mS[0]; DisajointTree tree(V.cols()); for (int i = 0; i < edge_diff.size(); ++i) { if (edge_diff[i].array().abs().sum() == 0) { tree.Merge(edge_values[i].x, edge_values[i].y); } } tree.BuildCompactParent(); int num = tree.CompactNum(); // Find the most descriptive vertex std::vector v_positions(num, Vector3d(0, 0, 0)); std::vector v_count(num); std::vector v_distance(num, 1e30); std::vector v_index(num, -1); for (int i = 0; i < V.cols(); ++i) { v_positions[tree.Index(i)] += O.col(i); v_count[tree.Index(i)] += 1; } for (int i = 0; i < num; ++i) { if (v_count[i] > 0) v_positions[i] /= v_count[i]; } for (int i = 0; i < V.cols(); ++i) { int p = tree.Index(i); double dis = (v_positions[p] - V.col(i)).squaredNorm(); if (dis < v_distance[p]) { v_distance[p] = dis; v_index[p] = i; } } std::set compact_sharp_vertices; for (auto& v : sharp_vertices) { v_positions[tree.Index(v)] = O.col(v); v_index[tree.Index(v)] = v; V.col(v) = O.col(v); compact_sharp_vertices.insert(tree.Index(v)); } std::vector>> ideal_distances(tree.CompactNum()); for (int e = 0; e < edge_diff.size(); ++e) { int v1 = edge_values[e].x; int v2 = edge_values[e].y; int p1 = tree.Index(v1); int p2 = tree.Index(v2); int q1 = v_index[p1]; int q2 = v_index[p2]; Vector3d q_1 = Q.col(v1); Vector3d q_2 = Q.col(v2); Vector3d n_1 = N.col(v1); Vector3d n_2 = N.col(v2); Vector3d q_1_y = n_1.cross(q_1); Vector3d q_2_y = n_2.cross(q_2); auto index = compat_orientation_extrinsic_index_4(q_1, n_1, q_2, n_2); double s_x1 = S(0, v1), s_y1 = S(1, v1); double s_x2 = S(0, v2), s_y2 = S(1, v2); int rank_diff = (index.second + 4 - index.first) % 4; if (rank_diff % 2 == 1) std::swap(s_x2, s_y2); Vector3d qd_x = 0.5 * (rotate90_by(q_2, n_2, rank_diff) + q_1); Vector3d qd_y = 0.5 * (rotate90_by(q_2_y, n_2, rank_diff) + q_1_y); double scale_x = (with_scale ? 0.5 * (s_x1 + s_x2) : 1) * mRes.mScale; double scale_y = (with_scale ? 0.5 * (s_y1 + s_y2) : 1) * mRes.mScale; Vector2i diff = edge_diff[e]; Vector3d origin1 = /*(sharp_constraints.count(q1)) ? sharp_constraints[q1].first : */ V.col(q1); Vector3d origin2 = /*(sharp_constraints.count(q2)) ? sharp_constraints[q2].first : */ V.col(q2); Vector3d C = diff[0] * scale_x * qd_x + diff[1] * scale_y * qd_y + origin1 - origin2; auto it = ideal_distances[p1].find(p2); if (it == ideal_distances[p1].end()) { ideal_distances[p1][p2] = std::make_pair(1, C); } else { it->second.first += 1; it->second.second += C; } } std::vector> entries(num * 2); std::vector b(num * 2); for (int m = 0; m < num; ++m) { int v1 = v_index[m]; for (auto& info : ideal_distances[m]) { int v2 = v_index[info.first]; Vector3d q_1 = Q.col(v1); Vector3d q_2 = Q.col(v2); if (sharp_constraints.count(v1)) { Vector3d d = sharp_constraints[v1].second; if (d != Vector3d::Zero()) q_1 = d; } if (sharp_constraints.count(v2)) { Vector3d d = sharp_constraints[v2].second; if (d != Vector3d::Zero()) q_2 = d; } Vector3d n_1 = N.col(v1); Vector3d n_2 = N.col(v2); Vector3d q_1_y = n_1.cross(q_1); Vector3d q_2_y = n_2.cross(q_2); Vector3d weights[] = {q_2, q_2_y, -q_1, -q_1_y}; int vid[] = {info.first * 2, info.first * 2 + 1, m * 2, m * 2 + 1}; Vector3d dis = info.second.second / info.second.first; double lambda = 1; if (sharp_vertices.count(v1) && sharp_vertices.count(v2)) lambda = 1; for (int i = 0; i < 4; ++i) { for (int j = 0; j < 4; ++j) { auto it = entries[vid[i]].find(vid[j]); if (it == entries[vid[i]].end()) { entries[vid[i]][vid[j]] = weights[i].dot(weights[j]) * lambda; } else { entries[vid[i]][vid[j]] += weights[i].dot(weights[j]) * lambda; } } b[vid[i]] += weights[i].dot(dis) * lambda; } } } std::vector fixed_dim(num * 2, 0); std::vector x(num * 2); #ifdef WITH_OMP #pragma omp parallel for #endif for (int i = 0; i < num; ++i) { int p = v_index[i]; Vector3d q = Q.col(p); if (sharp_constraints.count(p)) { Vector3d dir = sharp_constraints[p].second; fixed_dim[i * 2 + 1] = 1; if (dir != Vector3d::Zero()) { q = dir; } else fixed_dim[i * 2] = 1; } Vector3d n = N.col(p); Vector3d q_y = n.cross(q); x[i * 2] = (v_positions[i] - V.col(p)).dot(q); x[i * 2 + 1] = (v_positions[i] - V.col(p)).dot(q_y); } // fix sharp edges for (int i = 0; i < entries.size(); ++i) { if (fixed_dim[i]) { b[i] = x[i]; entries[i].clear(); entries[i][i] = 1; } else { std::unordered_map newmap; for (auto& rec : entries[i]) { if (fixed_dim[rec.first]) { b[i] -= rec.second * x[rec.first]; } else { newmap[rec.first] = rec.second; } } std::swap(entries[i], newmap); } } for (int i = 0; i < entries.size(); ++i) { if (entries[i].size() == 0) { entries[i][i] = 1; } } std::vector> lhsTriplets; lhsTriplets.reserve(F.cols() * 6); Eigen::SparseMatrix A(num * 2, num * 2); VectorXd rhs(num * 2); rhs.setZero(); for (int i = 0; i < entries.size(); ++i) { rhs(i) = b[i]; if (std::isnan(b[i])) { printf("Equation has nan!\n"); exit(0); } for (auto& rec : entries[i]) { lhsTriplets.push_back(Eigen::Triplet(i, rec.first, rec.second)); if (std::isnan(rec.second)) { printf("Equation has nan!\n"); exit(0); } } } A.setFromTriplets(lhsTriplets.begin(), lhsTriplets.end()); #ifdef LOG_OUTPUT int t1 = GetCurrentTime64(); #endif /* Eigen::setNbThreads(1); ConjugateGradient, Lower | Upper> solver; VectorXd x0 = VectorXd::Map(x.data(), x.size()); solver.setMaxIterations(40); solver.compute(A); */ LinearSolver> solver; solver.analyzePattern(A); solver.factorize(A); VectorXd x_new = solver.solve(rhs); #ifdef LOG_OUTPUT // std::cout << "[LSQ] n_iteration:" << solver.iterations() << std::endl; // std::cout << "[LSQ] estimated error:" << solver.error() << std::endl; int t2 = GetCurrentTime64(); printf("[LSQ] Linear solver uses %lf seconds.\n", (t2 - t1) * 1e-3); #endif for (int i = 0; i < x.size(); ++i) { if (!std::isnan(x_new[i])) { if (!fixed_dim[i / 2 * 2 + 1]) { double total = 0; for (auto& res : entries[i]) { double t = x_new[res.first]; if (std::isnan(t)) t = 0; total += t * res.second; } } x[i] = x_new[i]; } } for (int i = 0; i < O.cols(); ++i) { int p = tree.Index(i); int c = v_index[p]; Vector3d q = Q.col(c); if (fixed_dim[p * 2 + 1]) { Vector3d dir = sharp_constraints[c].second; if (dir != Vector3d::Zero()) q = dir; } Vector3d n = N.col(c); Vector3d q_y = n.cross(q); O.col(i) = V.col(c) + q * x[p * 2] + q_y * x[p * 2 + 1]; } } void Optimizer::optimize_integer_constraints(Hierarchy& mRes, std::map& singularities, bool use_minimum_cost_flow) { int edge_capacity = 2; bool fullFlow = false; std::vector>& AllowChange = mRes.mAllowChanges; for (int level = mRes.mToUpperEdges.size(); level >= 0; --level) { auto& EdgeDiff = mRes.mEdgeDiff[level]; auto& FQ = mRes.mFQ[level]; auto& F2E = mRes.mF2E[level]; auto& E2F = mRes.mE2F[level]; int iter = 0; while (!fullFlow) { std::vector edge_to_constraints(E2F.size() * 2, Vector4i(-1, 0, -1, 0)); std::vector initial(F2E.size() * 2, 0); for (int i = 0; i < F2E.size(); ++i) { for (int j = 0; j < 3; ++j) { int e = F2E[i][j]; Vector2i index = rshift90(Vector2i(e * 2 + 1, e * 2 + 2), FQ[i][j]); for (int k = 0; k < 2; ++k) { int l = abs(index[k]); int s = index[k] / l; int ind = l - 1; int equationID = i * 2 + k; if (edge_to_constraints[ind][0] == -1) { edge_to_constraints[ind][0] = equationID; edge_to_constraints[ind][1] = s; } else { edge_to_constraints[ind][2] = equationID; edge_to_constraints[ind][3] = s; } initial[equationID] += s * EdgeDiff[ind / 2][ind % 2]; } } } std::vector> arcs; std::vector arc_ids; for (int i = 0; i < edge_to_constraints.size(); ++i) { if (AllowChange[level][i] == 0) continue; if (edge_to_constraints[i][0] == -1 || edge_to_constraints[i][2] == -1) continue; if (edge_to_constraints[i][1] == -edge_to_constraints[i][3]) { int v1 = edge_to_constraints[i][0]; int v2 = edge_to_constraints[i][2]; if (edge_to_constraints[i][1] < 0) std::swap(v1, v2); int current_v = EdgeDiff[i / 2][i % 2]; arcs.push_back(std::make_pair(Vector2i(v1, v2), current_v)); if (AllowChange[level][i] == 1) arc_ids.push_back(i + 1); else { arc_ids.push_back(-(i + 1)); } } } int supply = 0; int demand = 0; for (int i = 0; i < initial.size(); ++i) { int init_val = initial[i]; if (init_val > 0) { arcs.push_back(std::make_pair(Vector2i(-1, i), initial[i])); supply += init_val; } else if (init_val < 0) { demand -= init_val; arcs.push_back(std::make_pair(Vector2i(i, initial.size()), -init_val)); } } std::unique_ptr solver = nullptr; if (use_minimum_cost_flow && level == mRes.mToUpperEdges.size()) { lprintf("network simplex MCF is used\n"); solver = std::make_unique(); } else if (supply < 20) { solver = std::make_unique(); } else { solver = std::make_unique(); } #ifdef WITH_GUROBI if (use_minimum_cost_flow && level == mRes.mToUpperEdges.size()) { solver = std::make_unique(); } #endif solver->resize(initial.size() + 2, arc_ids.size()); std::set ids; for (int i = 0; i < arcs.size(); ++i) { int v1 = arcs[i].first[0] + 1; int v2 = arcs[i].first[1] + 1; int c = arcs[i].second; if (v1 == 0 || v2 == initial.size() + 1) { solver->addEdge(v1, v2, c, 0, -1); } else { if (arc_ids[i] > 0) solver->addEdge(v1, v2, std::max(0, c + edge_capacity), std::max(0, -c + edge_capacity), arc_ids[i] - 1); else { if (c > 0) solver->addEdge(v1, v2, std::max(0, c - 1), std::max(0, -c + edge_capacity), -1 - arc_ids[i]); else solver->addEdge(v1, v2, std::max(0, c + edge_capacity), std::max(0, -c - 1), -1 - arc_ids[i]); } } } int flow_count = solver->compute(); solver->applyTo(EdgeDiff); lprintf("flow_count = %d, supply = %d\n", flow_count, supply); if (flow_count == supply) fullFlow = true; if (level != 0 || fullFlow) break; edge_capacity += 1; iter++; if (iter == 10) { /* Probably won't converge. */ break; } lprintf("Not full flow, edge_capacity += 1\n"); } if (level != 0) { auto& nEdgeDiff = mRes.mEdgeDiff[level - 1]; auto& toUpper = mRes.mToUpperEdges[level - 1]; auto& toUpperOrients = mRes.mToUpperOrients[level - 1]; for (int i = 0; i < toUpper.size(); ++i) { if (toUpper[i] >= 0) { int orient = (4 - toUpperOrients[i]) % 4; nEdgeDiff[i] = rshift90(EdgeDiff[toUpper[i]], orient); } } } } } #ifdef WITH_CUDA void Optimizer::optimize_orientations_cuda(Hierarchy& mRes) { int levelIterations = 6; for (int level = mRes.mN.size() - 1; level >= 0; --level) { Link* adj = mRes.cudaAdj[level]; int* adjOffset = mRes.cudaAdjOffset[level]; glm::dvec3* N = mRes.cudaN[level]; glm::dvec3* Q = mRes.cudaQ[level]; auto& phases = mRes.cudaPhases[level]; for (int iter = 0; iter < levelIterations; ++iter) { for (int phase = 0; phase < phases.size(); ++phase) { int* p = phases[phase]; UpdateOrientation(p, mRes.mPhases[level][phase].size(), N, Q, adj, adjOffset, mRes.mAdj[level][phase].size()); } } if (level > 0) { glm::dvec3* srcField = mRes.cudaQ[level]; glm::ivec2* toUpper = mRes.cudaToUpper[level - 1]; glm::dvec3* destField = mRes.cudaQ[level - 1]; glm::dvec3* N = mRes.cudaN[level - 1]; PropagateOrientationUpper(srcField, mRes.mQ[level].cols(), toUpper, N, destField); } } for (int l = 0; l < mRes.mN.size() - 1; ++l) { glm::dvec3* N = mRes.cudaN[l]; glm::dvec3* N_next = mRes.cudaN[l + 1]; glm::dvec3* Q = mRes.cudaQ[l]; glm::dvec3* Q_next = mRes.cudaQ[l + 1]; glm::ivec2* toUpper = mRes.cudaToUpper[l]; PropagateOrientationLower(toUpper, Q, N, Q_next, N_next, mRes.mToUpper[l].cols()); } } void Optimizer::optimize_positions_cuda(Hierarchy& mRes) { int levelIterations = 6; for (int level = mRes.mAdj.size() - 1; level >= 0; --level) { Link* adj = mRes.cudaAdj[level]; int* adjOffset = mRes.cudaAdjOffset[level]; glm::dvec3* N = mRes.cudaN[level]; glm::dvec3* Q = mRes.cudaQ[level]; glm::dvec3* V = mRes.cudaV[level]; glm::dvec3* O = mRes.cudaO[level]; std::vector phases = mRes.cudaPhases[level]; for (int iter = 0; iter < levelIterations; ++iter) { for (int phase = 0; phase < phases.size(); ++phase) { int* p = phases[phase]; UpdatePosition(p, mRes.mPhases[level][phase].size(), N, Q, adj, adjOffset, mRes.mAdj[level][phase].size(), V, O, mRes.mScale); } } if (level > 0) { glm::dvec3* srcField = mRes.cudaO[level]; glm::ivec2* toUpper = mRes.cudaToUpper[level - 1]; glm::dvec3* destField = mRes.cudaO[level - 1]; glm::dvec3* N = mRes.cudaN[level - 1]; glm::dvec3* V = mRes.cudaV[level - 1]; PropagatePositionUpper(srcField, mRes.mO[level].cols(), toUpper, N, V, destField); } } } #endif } // namespace qflow