eos/doc/linear__shape__fitting_8hpp_source.html

/*

 * eos - A 3D Morphable Model fitting library written in modern C++11/14.

 *

 * File: include/eos/fitting/linear_shape_fitting.hpp

 *

 * Copyright 2014, 2015 Patrik Huber

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 * http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */

#pragma once


#ifndef EOS_LINEAR_SHAPE_FITTING_HPP

#define EOS_LINEAR_SHAPE_FITTING_HPP


#include "eos/morphablemodel/PcaModel.hpp"

#include "eos/cpp17/optional.hpp"


#include "Eigen/Core"

#include "Eigen/QR"

#include "Eigen/Sparse"


#include <vector>

#include <cstdint>

#include <cassert>


namespace eos {

namespace fitting {


/**
 * @brief Linearly fits the shape coefficients of a PCA shape model to 2D landmarks, given an
 * affine camera matrix.
 *
 * Builds and solves the regularised linear system
 * \f$ (A^t \Omega A + \lambda I) c_s = -A^t \Omega b \f$, where
 * \f$ A = P \hat{V}_h \f$ (camera applied to the selected basis rows) and
 * \f$ b = P \bar{v} - y \f$ (camera applied to the base face, minus the landmarks).
 * The rescaled PCA basis is used, so (per the original author's notes) the returned
 * coefficients are variance-normalised.
 *
 * @param[in] shape_model The PCA shape model; queried for its mean, its number of principal
 *                        components and its rescaled basis rows at each vertex.
 * @param[in] affine_camera_matrix The 3x4 affine camera matrix, placed on the block diagonal of P.
 * @param[in] landmarks 2D landmark positions. Must have the same size as \p vertex_ids (asserted).
 * @param[in] vertex_ids For each landmark, the id of the corresponding model vertex.
 * @param[in] base_face Face (x_1, y_1, z_1, x_2, ...) that the basis is added to. If empty, the
 *                      model mean is used.
 * @param[in] lambda Regularisation weight; \p lambda times the identity is added to the system matrix.
 * @param[in] num_coefficients_to_fit Number of leading shape coefficients to fit. If not given, all
 *                                    principal components of \p shape_model are used.
 * @param[in] detector_standard_deviation Standard deviation of the 2D landmark detector (the
 *                                        original notes give it in pixels). Defaults to sqrt(3).
 * @param[in] model_standard_deviation Standard deviation of the 3D model points (the original notes
 *                                     say it is to be given projected to 2D). Defaults to 0.
 * @return The fitted shape coefficients, one per fitted principal component.
 */
inline std::vector<float> fit_shape_to_landmarks_linear(
    const morphablemodel::PcaModel& shape_model, Eigen::Matrix<float, 3, 4> affine_camera_matrix,
    const std::vector<Eigen::Vector2f>& landmarks, const std::vector<int>& vertex_ids,
    Eigen::VectorXf base_face = Eigen::VectorXf(), float lambda = 3.0f,
    cpp17::optional<int> num_coefficients_to_fit = cpp17::optional<int>(),
    cpp17::optional<float> detector_standard_deviation = cpp17::optional<float>(),
    cpp17::optional<float> model_standard_deviation = cpp17::optional<float>())
{
    assert(landmarks.size() == vertex_ids.size());

    using Eigen::MatrixXf;
    using Eigen::VectorXf;

    const int num_coeffs_to_fit = num_coefficients_to_fit.value_or(shape_model.get_num_principal_components());
    const int num_landmarks = static_cast<int>(landmarks.size());

    if (base_face.size() == 0)
    {
        base_face = shape_model.get_mean();
    }

    // $\hat{V}_h \in R^{4N \times n}$ (n = num_coeffs_to_fit): for each landmark, the three basis rows
    // of its vertex followed by a row of zeros (the homogeneous coordinate).
    MatrixXf V_hat_h = MatrixXf::Zero(4 * num_landmarks, num_coeffs_to_fit);

    // $P \in R^{3N \times 4N}$: block-diagonal matrix with the camera matrix on the diagonal.
    Eigen::SparseMatrix<float> P(3 * num_landmarks, 4 * num_landmarks);
    std::vector<Eigen::Triplet<float>> P_coefficients; // list of the non-zero coefficients of P
    P_coefficients.reserve(landmarks.size() * (3 * 4)); // one 3x4 camera block per landmark

    // The landmarks in homogeneous coordinates, $3N \times 1$. Initialised to one, so the third
    // (homogeneous) entry of every landmark is already set.
    VectorXf y = VectorXf::Ones(3 * num_landmarks);

    // The base face at the landmark vertices with an added homogeneous coordinate,
    // (x_1, y_1, z_1, 1, x_2, ...)^t. Initialised to one for the same reason as y.
    VectorXf v_bar = VectorXf::Ones(4 * num_landmarks);

    for (int i = 0; i < num_landmarks; ++i)
    {
        const int vertex_id = vertex_ids[i];

        // The original author was unsure whether the paper uses the orthonormal basis, and
        // concluded (PH, 26.5.2014) that the rescaled basis is fine/better.
        const MatrixXf basis_rows = shape_model.get_rescaled_pca_basis_at_point(vertex_id);
        // Fill three rows; the fourth row of each group of four stays all zeros.
        V_hat_h.block(4 * i, 0, 3, V_hat_h.cols()) =
            basis_rows.block(0, 0, basis_rows.rows(), num_coeffs_to_fit);

        for (int row = 0; row < affine_camera_matrix.rows(); ++row)
        {
            for (int col = 0; col < affine_camera_matrix.cols(); ++col)
            {
                P_coefficients.emplace_back(3 * i + row, 4 * i + col, affine_camera_matrix(row, col));
            }
        }

        y.segment<2>(3 * i) = landmarks[i];
        v_bar.segment<3>(4 * i) = base_face.segment<3>(3 * vertex_id);
    }
    P.setFromTriplets(P_coefficients.begin(), P_coefficients.end());

    // The variances: the squared 2D (detector) and 3D (model) standard deviations are added.
    // Defaults if the caller does not provide them:
    //  - detector standard deviation: sqrt(3) (the original notes say this follows paper [1], in pixels),
    //  - model standard deviation: 0. According to the original notes it only makes sense to set it
    //    when the variance differs per vertex, and it has to be projected to 2D so the units match.
    const float sigma_squared_2D = std::pow(detector_standard_deviation.value_or(std::sqrt(3.0f)), 2) +
                                   std::pow(model_standard_deviation.value_or(0.0f), 2);
    // Omega is diagonal with the constant 1/sigma_squared_2D; stored as a vector and used through
    // .asDiagonal().
    const VectorXf Omega = VectorXf::Constant(3 * num_landmarks, 1.0f / sigma_squared_2D);

    // Bring into standard regularised quadratic form with the diagonal distance matrix Omega:
    const MatrixXf A = P * V_hat_h;   // camera matrix times the basis
    const MatrixXf b = P * v_bar - y; // camera matrix times the base face, minus the landmarks
    const MatrixXf AtOmegaAReg = A.transpose() * Omega.asDiagonal() * A +
                                 lambda * Eigen::MatrixXf::Identity(num_coeffs_to_fit, num_coeffs_to_fit);
    // It's -A^t * Omega^t * b, but Omega is diagonal, so Omega^t = Omega.
    const MatrixXf rhs = -A.transpose() * Omega.asDiagonal() * b;

    // c_s: the 'x' that we solve for. Per the original notes this is the variance-normalised shape
    // parameter vector: because the rescaled basis is used, the coefficients are not multiplied
    // with their eigenvalues.
    const VectorXf c_s = AtOmegaAReg.colPivHouseholderQr().solve(rhs);

    return std::vector<float>(c_s.data(), c_s.data() + c_s.size());
}


/**
 * @brief Linearly fits one set of shape coefficients of a PCA shape model to the 2D landmarks of
 * several images, each with its own affine camera matrix.
 *
 * The equations of all images are stacked into one system, which is then solved as
 * \f$ (A^t \Omega A + \lambda I) c_s = -A^t \Omega b \f$, with \f$ A = P \hat{V}_h \f$ and
 * \f$ b = P \bar{v} - y \f$. \p lambda is multiplied by the number of images before use.
 *
 * @param[in] shape_model The PCA shape model; queried for its mean, its number of principal
 *                        components and its rescaled basis rows at each vertex.
 * @param[in] affine_camera_matrices One 3x4 affine camera matrix per image.
 * @param[in] landmarks For each image, its 2D landmark positions.
 * @param[in] vertex_ids For each image, the model vertex id of every landmark. Must have the same
 *                       outer size as \p landmarks and \p affine_camera_matrices, and the same
 *                       inner sizes as \p landmarks (asserted).
 * @param[in] base_faces For each image, the face (x_1, y_1, z_1, x_2, ...) that the basis is added
 *                       to. An empty vector, or an empty entry, selects the model mean. If
 *                       non-empty, it must contain one entry per image (asserted).
 * @param[in] lambda Regularisation weight (per image).
 * @param[in] num_coefficients_to_fit Number of leading shape coefficients to fit. If not given, all
 *                                    principal components of \p shape_model are used.
 * @param[in] detector_standard_deviation Standard deviation of the 2D landmark detector (the
 *                                        original notes give it in pixels). Defaults to sqrt(3).
 * @param[in] model_standard_deviation Standard deviation of the 3D model points (the original notes
 *                                     say it is to be given projected to 2D). Defaults to 0.
 * @return The fitted shape coefficients, one per fitted principal component.
 */
inline std::vector<float>
fit_shape_to_landmarks_linear_multi(const morphablemodel::PcaModel& shape_model,
                                    const std::vector<Eigen::Matrix<float, 3, 4>>& affine_camera_matrices,
                                    const std::vector<std::vector<Eigen::Vector2f>>& landmarks,
                                    const std::vector<std::vector<int>>& vertex_ids,
                                    std::vector<Eigen::VectorXf> base_faces = std::vector<Eigen::VectorXf>(),
                                    float lambda = 3.0f,
                                    cpp17::optional<int> num_coefficients_to_fit = cpp17::optional<int>(),
                                    cpp17::optional<float> detector_standard_deviation = cpp17::optional<float>(),
                                    cpp17::optional<float> model_standard_deviation = cpp17::optional<float>())
{
    using Eigen::MatrixXf;
    using Eigen::VectorXf;

    // Same number of instances (i.e. images/frames) for each of them:
    assert(affine_camera_matrices.size() == landmarks.size() && landmarks.size() == vertex_ids.size());
    const int num_images = static_cast<int>(affine_camera_matrices.size());

    // The default argument is an empty vector. Expand it to one empty entry per image, so that the
    // per-image fallback to the model mean below never indexes out of bounds.
    if (base_faces.empty())
    {
        base_faces.resize(affine_camera_matrices.size());
    }
    assert(base_faces.size() == affine_camera_matrices.size());

    // Total number of landmarks over all images (N in the matrix dimensions below):
    int total_num_landmarks = 0;
    for (int k = 0; k < num_images; ++k)
    {
        assert(landmarks[k].size() == vertex_ids[k].size()); // has to be valid for each image
        total_num_landmarks += static_cast<int>(landmarks[k].size());
    }

    const int num_coeffs_to_fit = num_coefficients_to_fit.value_or(shape_model.get_num_principal_components());

    // The regularisation has to be adjusted when more than one image is given:
    lambda *= static_cast<float>(num_images);

    // $\hat{V}_h \in R^{4N \times n}$ (n = num_coeffs_to_fit): for each landmark, the three basis rows
    // of its vertex followed by a row of zeros (the homogeneous coordinate).
    MatrixXf V_hat_h = MatrixXf::Zero(4 * total_num_landmarks, num_coeffs_to_fit);

    // $P \in R^{3N \times 4N}$: block-diagonal matrix with each landmark's camera matrix on the diagonal.
    Eigen::SparseMatrix<float> P(3 * total_num_landmarks, 4 * total_num_landmarks);
    std::vector<Eigen::Triplet<float>> P_coefficients; // list of the non-zero coefficients of P
    P_coefficients.reserve(static_cast<std::size_t>(total_num_landmarks) * (3 * 4)); // 3x4 block per landmark

    // The landmarks in homogeneous coordinates, $3N \times 1$. Initialised to one, so the third
    // (homogeneous) entry of every landmark is already set.
    VectorXf y = VectorXf::Ones(3 * total_num_landmarks);

    // The base faces at the landmark vertices with an added homogeneous coordinate,
    // (x_1, y_1, z_1, 1, x_2, ...)^t. Initialised to one for the same reason as y.
    VectorXf v_bar = VectorXf::Ones(4 * total_num_landmarks);

    // Running index over the landmarks of all images; it addresses the rows of V_hat_h, y and v_bar
    // and the diagonal block of P that belong to the current landmark.
    int landmark_index = 0;
    for (int k = 0; k < num_images; ++k)
    {
        // For each image we have, set up the equations and add them to the matrices:
        const Eigen::Matrix<float, 3, 4>& camera = affine_camera_matrices[k];

        VectorXf& base_face = base_faces[k];
        if (base_face.size() == 0)
        {
            base_face = shape_model.get_mean();
        }

        const int num_landmarks = static_cast<int>(landmarks[k].size());
        for (int i = 0; i < num_landmarks; ++i, ++landmark_index)
        {
            const int vertex_id = vertex_ids[k][i];

            // The original author was unsure whether the paper uses the orthonormal basis, and
            // concluded (PH, 26.5.2014) that the rescaled basis is fine/better.
            const MatrixXf basis_rows = shape_model.get_rescaled_pca_basis_at_point(vertex_id);
            // Fill three rows; the fourth row of each group of four stays all zeros.
            V_hat_h.block(4 * landmark_index, 0, 3, V_hat_h.cols()) =
                basis_rows.block(0, 0, basis_rows.rows(), num_coeffs_to_fit);

            for (int row = 0; row < camera.rows(); ++row)
            {
                for (int col = 0; col < camera.cols(); ++col)
                {
                    P_coefficients.emplace_back(3 * landmark_index + row, 4 * landmark_index + col,
                                                camera(row, col));
                }
            }

            y.segment<2>(3 * landmark_index) = landmarks[k][i];
            v_bar.segment<3>(4 * landmark_index) = base_face.segment<3>(3 * vertex_id);
        }
    }
    // Fill P once, after the coefficients of all images have been collected:
    P.setFromTriplets(P_coefficients.begin(), P_coefficients.end());

    // The variances: the squared 2D (detector) and 3D (model) standard deviations are added.
    // Defaults if the caller does not provide them:
    //  - detector standard deviation: sqrt(3) (the original notes say this follows paper [1], in pixels),
    //  - model standard deviation: 0. According to the original notes it only makes sense to set it
    //    when the variance differs per vertex, and it has to be projected to 2D so the units match.
    const float sigma_squared_2D = std::pow(detector_standard_deviation.value_or(std::sqrt(3.0f)), 2) +
                                   std::pow(model_standard_deviation.value_or(0.0f), 2);
    // Omega is diagonal with the constant 1/sigma_squared_2D; stored as a vector and used through
    // .asDiagonal().
    const VectorXf Omega = VectorXf::Constant(3 * total_num_landmarks, 1.0f / sigma_squared_2D);

    // Bring into standard regularised quadratic form with the diagonal distance matrix Omega:
    const MatrixXf A = P * V_hat_h;   // camera matrices times the basis
    const MatrixXf b = P * v_bar - y; // camera matrices times the base faces, minus the landmarks
    const MatrixXf AtOmegaAReg = A.transpose() * Omega.asDiagonal() * A +
                                 lambda * Eigen::MatrixXf::Identity(num_coeffs_to_fit, num_coeffs_to_fit);
    // It's -A^t * Omega^t * b, but Omega is diagonal, so Omega^t = Omega.
    const MatrixXf rhs = -A.transpose() * Omega.asDiagonal() * b;

    // c_s: the 'x' that we solve for. Per the original notes this is the variance-normalised shape
    // parameter vector: because the rescaled basis is used, the coefficients are not multiplied
    // with their eigenvalues.
    const VectorXf c_s = AtOmegaAReg.colPivHouseholderQr().solve(rhs);

    return std::vector<float>(c_s.data(), c_s.data() + c_s.size());
}


} /* namespace fitting */

} /* namespace eos */


#endif /* EOS_LINEAR_SHAPE_FITTING_HPP */

eos::morphablemodel::PcaModel
This class represents a PCA-model that consists of:
Definition: PcaModel.hpp:59

eos::morphablemodel::PcaModel::get_num_principal_components
int get_num_principal_components() const
Definition: PcaModel.hpp:88

eos::morphablemodel::PcaModel::get_rescaled_pca_basis_at_point
Eigen::MatrixXf get_rescaled_pca_basis_at_point(int vertex_id) const
Definition: PcaModel.hpp:223

eos::morphablemodel::PcaModel::get_mean
const Eigen::VectorXf & get_mean() const
Definition: PcaModel.hpp:123

eos::fitting::fit_shape_to_landmarks_linear_multi
std::vector< float > fit_shape_to_landmarks_linear_multi(const morphablemodel::PcaModel &shape_model, const std::vector< Eigen::Matrix< float, 3, 4 > > &affine_camera_matrices, const std::vector< std::vector< Eigen::Vector2f > > &landmarks, const std::vector< std::vector< int > > &vertex_ids, std::vector< Eigen::VectorXf > base_faces=std::vector< Eigen::VectorXf >(), float lambda=3.0f, cpp17::optional< int > num_coefficients_to_fit=cpp17::optional< int >(), cpp17::optional< float > detector_standard_deviation=cpp17::optional< float >(), cpp17::optional< float > model_standard_deviation=cpp17::optional< float >())
Definition: linear_shape_fitting.hpp:178

eos::fitting::fit_shape_to_landmarks_linear
std::vector< float > fit_shape_to_landmarks_linear(const morphablemodel::PcaModel &shape_model, Eigen::Matrix< float, 3, 4 > affine_camera_matrix, const std::vector< Eigen::Vector2f > &landmarks, const std::vector< int > &vertex_ids, Eigen::VectorXf base_face=Eigen::VectorXf(), float lambda=3.0f, cpp17::optional< int > num_coefficients_to_fit=cpp17::optional< int >(), cpp17::optional< float > detector_standard_deviation=cpp17::optional< float >(), cpp17::optional< float > model_standard_deviation=cpp17::optional< float >())
Definition: linear_shape_fitting.hpp:60

eos
Namespace containing all of eos's 3D model fitting functionality.