mpp.hpp
Go to the documentation of this file.
1 /*
2 Copyright (c) 2015-2019, Florian Sittel (www.lettis.net) and Daniel Nagel
3 All rights reserved.
4 
5 Redistribution and use in source and binary forms, with or without
6 modification, are permitted provided that the following conditions are met:
7 
8 1. Redistributions of source code must retain the above copyright notice, this
9 list of conditions and the following disclaimer.
10 
11 2. Redistributions in binary form must reproduce the above copyright notice,
12 this list of conditions and the following disclaimer in the documentation
13 and/or other materials provided with the distribution.
14 
15 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
16 ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18 DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
19 FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
22 CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
23 OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
24 OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25 */
26 #pragma once
27 
28 #include <vector>
29 #include <map>
30 #include <set>
31 #include <stdexcept>
32 #include <string>
33 
34 #include <boost/program_options.hpp>
35 #include <boost/numeric/ublas/matrix_sparse.hpp>
36 #include <boost/numeric/ublas/io.hpp>
37 
38 #include "tools.hpp"
45 namespace Clustering {
57  namespace MPP {
59  using SparseMatrixF = boost::numeric::ublas::mapped_matrix<float>;
64  read_transition_probabilities(std::string fname);
68  transition_counts(std::vector<std::size_t> trajectory
69  , std::vector<std::size_t> concat_limits
70  , std::size_t n_lag_steps
71  , std::size_t i_max = 0);
75  weighted_transition_counts(std::vector<std::size_t> trajectory
76  , std::vector<std::size_t> concat_limits
77  , std::size_t n_lag_steps);
81  , std::set<std::size_t> microstate_names);
85  , std::map<std::size_t, std::size_t> sinks
86  , std::map<std::size_t, std::size_t> pops);
89  std::map<std::size_t, std::size_t>
90  single_step_future_state(SparseMatrixF transition_matrix,
91  std::set<std::size_t> cluster_names,
92  float q_min,
93  std::map<std::size_t, float> min_free_energy);
96  std::map<std::size_t, std::vector<std::size_t>>
97  most_probable_path(std::map<std::size_t, std::size_t> future_state, std::set<std::size_t> cluster_names);
99  std::map<std::size_t, std::size_t>
100  microstate_populations(std::vector<std::size_t> clusters, std::set<std::size_t> cluster_names);
103  std::map<std::size_t, float>
104  microstate_min_free_energy(const std::vector<std::size_t>& clustering,
105  const std::vector<float>& free_energy);
109  std::map<std::size_t, std::size_t>
110  path_sinks(std::vector<std::size_t> clusters,
111  std::map<std::size_t, std::vector<std::size_t>> mpp,
112  SparseMatrixF transition_matrix,
113  std::set<std::size_t> cluster_names,
114  float q_min,
115  std::vector<float> free_energy);
118  std::vector<std::size_t>
119  lumped_trajectory(std::vector<std::size_t> trajectory,
120  std::map<std::size_t, std::size_t> sinks);
122  std::tuple<std::vector<std::size_t>
123  , std::map<std::size_t, std::size_t>
124  , SparseMatrixF>
125  fixed_metastability_clustering(std::vector<std::size_t> initial_trajectory,
126  SparseMatrixF trans_prob,
127  float q_min,
128  std::vector<float> free_energy);
144  void
145  main(boost::program_options::variables_map args);
146  } // end namespace Clustering::MPP
147 } // end namespace Clustering
148 
boost::numeric::ublas::mapped_matrix< float > SparseMatrixF
BOOST implementation of a sparse matrix for floats.
Definition: mpp.hpp:59
SparseMatrixF read_transition_probabilities(std::string fname)
read (row-normalized) transition matrix from file
Definition: mpp.cpp:38
SparseMatrixF row_normalized_transition_probabilities(SparseMatrixF count_matrix, std::set< std::size_t > cluster_names)
compute transition matrix from counts by normalization of rows
Definition: mpp.cpp:159
general namespace for clustering package
Definition: coring.cpp:38
Tools mainly for IO and some other functions.
std::map< std::size_t, std::size_t > microstate_populations(std::vector< std::size_t > clusters, std::set< std::size_t > cluster_names)
compute cluster populations
Definition: mpp.cpp:308
std::map< std::size_t, float > microstate_min_free_energy(const std::vector< std::size_t > &clustering, const std::vector< float > &free_energy)
Definition: mpp.cpp:320
std::map< std::size_t, std::vector< std::size_t > > most_probable_path(std::map< std::size_t, std::size_t > future_state, std::set< std::size_t > cluster_names)
Definition: mpp.cpp:288
std::map< std::size_t, std::size_t > path_sinks(std::vector< std::size_t > clusters, std::map< std::size_t, std::vector< std::size_t >> mpp, SparseMatrixF transition_matrix, std::set< std::size_t > cluster_names, float q_min, std::vector< float > free_energy)
Definition: mpp.cpp:337
std::map< std::size_t, Clustering::Tools::Neighbor > Neighborhood
map frame id to neighbors
Definition: tools.hpp:66
SparseMatrixF updated_transition_probabilities(SparseMatrixF transition_matrix, std::map< std::size_t, std::size_t > sinks, std::map< std::size_t, std::size_t > pops)
update transition matrix after lumping states into sinks
Definition: mpp.cpp:181
Clustering::Tools::Neighborhood Neighborhood
Neighborhood per frame.
Definition: mpp.hpp:61
std::map< std::size_t, std::size_t > single_step_future_state(SparseMatrixF transition_matrix, std::set< std::size_t > cluster_names, float q_min, std::map< std::size_t, float > min_free_energy)
Definition: mpp.cpp:234
SparseMatrixF weighted_transition_counts(std::vector< std::size_t > trajectory, std::vector< std::size_t > concat_limits, std::size_t n_lag_steps)
Definition: mpp.cpp:113
std::vector< std::size_t > lumped_trajectory(std::vector< std::size_t > trajectory, std::map< std::size_t, std::size_t > sinks)
Definition: mpp.cpp:400
SparseMatrixF transition_counts(std::vector< std::size_t > trajectory, std::vector< std::size_t > concat_limits, std::size_t n_lag_steps, std::size_t i_max)
Definition: mpp.cpp:78
void main(boost::program_options::variables_map args)
MPP clustering control function and user interface.
Definition: mpp.cpp:487
std::tuple< std::vector< std::size_t >, std::map< std::size_t, std::size_t >, SparseMatrixF > fixed_metastability_clustering(std::vector< std::size_t > initial_trajectory, SparseMatrixF trans_prob, float q_min, std::vector< float > free_energy)
run clustering for given Q_min value
Definition: mpp.cpp:413