tools.hpp
Go to the documentation of this file.
1 /*
2 Copyright (c) 2015-2019, Florian Sittel (www.lettis.net) and Daniel Nagel
3 All rights reserved.
4 
5 Redistribution and use in source and binary forms, with or without
6 modification, are permitted provided that the following conditions are met:
7 
8 1. Redistributions of source code must retain the above copyright notice, this
9 list of conditions and the following disclaimer.
10 
11 2. Redistributions in binary form must reproduce the above copyright notice,
12 this list of conditions and the following disclaimer in the documentation
13 and/or other materials provided with the distribution.
14 
15 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
16 ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18 DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
19 FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
22 CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
23 OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
24 OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25 */
26 #pragma once
27 
28 #include "config.hpp"
29 
30 #include <string>
31 #include <vector>
32 #include <map>
33 #include <tuple>
34 #include <memory>
35 #include <iostream>
36 
38 #if defined(__INTEL_COMPILER)
39  #include <malloc.h>
40 #else
41  #include <mm_malloc.h>
42 #endif
43 
44 #if defined(__INTEL_COMPILER)
45  #define ASSUME_ALIGNED(c) __assume_aligned( (c), DC_MEM_ALIGNMENT)
46 #else
47  #define ASSUME_ALIGNED(c) (c) = (float*) __builtin_assume_aligned( (c), DC_MEM_ALIGNMENT)
48 #endif
49 
55 namespace Clustering {
62 namespace Tools {
64  using Neighbor = std::pair<std::size_t, float>;
66  using Neighborhood = std::map<std::size_t, Clustering::Tools::Neighbor>;
68  void
69  write_pops(std::string fname, std::vector<std::size_t> pops, std::string header_comment,
70  std::map<std::string,float> stringMap);
72  void
73  write_fes(std::string fname, std::vector<float> fes, std::string header_comment,
74  std::map<std::string,float> stringMap);
76  std::vector<std::size_t>
77  read_clustered_trajectory(std::string filename);
79  void
80  write_clustered_trajectory(std::string filename, std::vector<std::size_t> traj,
81  std::string header_comment, std::map<std::string,float> stringMap);
83  template <typename NUM>
84  std::vector<NUM>
85  read_single_column(std::string filename);
87  template <typename NUM>
88  void
89  write_single_column(std::string filename, std::vector<NUM> dat,
90  std::string header_comment, bool with_scientific_format=false);
92  template <typename KEY, typename VAL>
93  void
94  write_map(std::string filename, std::map<KEY, VAL> mapping,
95  std::string header_comment, bool val_then_key=false);
97  std::vector<float>
98  read_free_energies(std::string filename);
101  std::vector<std::size_t>
102  read_concat_limits(std::string filename);
105  std::pair<Neighborhood, Neighborhood>
106  read_neighborhood(const std::string fname);
109  void
110  write_neighborhood(const std::string fname,
111  const Neighborhood& nh,
112  const Neighborhood& nh_high_dens,
113  std::string header_comment,
114  std::map<std::string,float> stringMap);
116  std::map<std::size_t, std::size_t>
117  microstate_populations(std::vector<std::size_t> traj);
122  template <typename NUM>
123  std::tuple<NUM*, std::size_t, std::size_t>
124  read_coords(std::string filename,
125  std::vector<std::size_t> usecols = std::vector<std::size_t>());
127  template <typename NUM>
128  void
129  free_coords(NUM* coords);
132  template <typename NUM>
133  std::vector<NUM>
134  dim1_sorted_coords(const NUM* coords
135  , std::size_t n_rows
136  , std::size_t n_cols);
140  template <typename NUM>
141  std::vector<NUM>
142  boxlimits(const std::vector<NUM>& xs
143  , std::size_t boxsize
144  , std::size_t n_rows
145  , std::size_t n_cols);
147  template <typename NUM>
148  std::pair<std::size_t, std::size_t>
149  min_max_box(const std::vector<NUM>& limits
150  , NUM val
151  , NUM radius);
153  unsigned int
154  min_multiplicator(unsigned int orig
155  , unsigned int mult);
157  std::string
158  stringprintf(const std::string& str, ...);
160  template <typename NUM>
161  NUM
162  string_to_num(const std::string &s);
164  template <typename T>
165  std::vector<T>
166  unique_elements(std::vector<T> xs);
168  void
169  check_concat_limits(std::vector<std::size_t> concat_limits,
170  std::size_t n_frames);
172  void
173  read_comments(std::string filename, std::map<std::string,float> &stringMap);
175  float
176  read_next_float(std::ifstream &ifs);
178  void
179  append_commentsMap(std::string &header_comment, std::map<std::string,float> &stringMap);
180 } // end namespace 'Tools'
181 } // end namespace 'Clustering'
182 
183 // template implementations
184 #include "tools.hxx"
185 
void write_pops(std::string filename, std::vector< std::size_t > pops, std::string header_comment, std::map< std::string, float > stringMap)
write populations as column into given file
Definition: tools.cpp:50
std::vector< std::size_t > read_concat_limits(std::string filename)
Definition: tools.cpp:133
std::tuple< NUM *, std::size_t, std::size_t > read_coords(std::string filename, std::vector< std::size_t > usecols=std::vector< std::size_t >())
Definition: tools.hxx:41
general namespace for clustering package
Definition: coring.cpp:38
std::map< std::size_t, std::size_t > microstate_populations(std::vector< std::size_t > traj)
compute microstate populations from clustered trajectory
Definition: tools.cpp:176
std::vector< NUM > dim1_sorted_coords(const NUM *coords, std::size_t n_rows, std::size_t n_cols)
Definition: tools.hxx:122
float read_next_float(std::ifstream &ifs)
read the next float of ifstream
Definition: tools.cpp:207
std::vector< float > read_free_energies(std::string filename)
read free energies from plain text file
Definition: tools.cpp:96
void free_coords(NUM *coords)
free memory pointing to coordinates
Definition: tools.hxx:116
void check_concat_limits(std::vector< std::size_t > concat_limits, std::size_t n_frames)
check if concat limits were passed correctly
Definition: tools.cpp:189
NUM string_to_num(const std::string &s)
convert std::string to number of given template format
Definition: tools.hxx:276
unsigned int min_multiplicator(unsigned int orig, unsigned int mult)
return minimum multiplicator to fulfill result * mult >= orig
Definition: tools.cpp:36
void write_map(std::string filename, std::map< KEY, VAL > mapping, std::string header_comment, bool val_then_key=false)
write key-value map to plain text file with key as first and value as second column ...
Definition: tools.hxx:209
std::pair< std::size_t, float > Neighbor
matches neighbor&#39;s frame id to distance
Definition: tools.hpp:64
void write_neighborhood(const std::string filename, const Neighborhood &nh, const Neighborhood &nh_high_dens, std::string header_comment, std::map< std::string, float > stringMap)
Definition: tools.cpp:144
std::map< std::size_t, Clustering::Tools::Neighbor > Neighborhood
map frame id to neighbors
Definition: tools.hpp:66
void read_comments(std::string filename, std::map< std::string, float > &stringMap)
read comments of stringMap from file. Comments should start with #@
Definition: tools.cpp:229
std::pair< Neighborhood, Neighborhood > read_neighborhood(const std::string filename)
Definition: tools.cpp:101
void append_commentsMap(std::string &header_comment, std::map< std::string, float > &stringMap)
append commentsMap to header comment
Definition: tools.cpp:267
std::vector< T > unique_elements(std::vector< T > xs)
return distinct elements of vector
Definition: tools.hxx:285
void write_single_column(std::string filename, std::vector< NUM > dat, std::string header_comment, bool with_scientific_format=false)
write single column of numbers to given file. number type (int, float, ...) given as template paramet...
Definition: tools.hxx:258
void write_fes(std::string filename, std::vector< float > fes, std::string header_comment, std::map< std::string, float > stringMap)
write free energies as column into given file
Definition: tools.cpp:42
void write_clustered_trajectory(std::string filename, std::vector< std::size_t > traj, std::string header_comment, std::map< std::string, float > stringMap)
write state trajectory into plain text file
Definition: tools.cpp:63
std::vector< NUM > boxlimits(const std::vector< NUM > &xs, std::size_t boxsize, std::size_t n_rows, std::size_t n_cols)
Definition: tools.hxx:159
std::vector< NUM > read_single_column(std::string filename)
read single column of numbers from given file. number type (int, float, ...) given as template parame...
Definition: tools.hxx:230
std::vector< std::size_t > read_clustered_trajectory(std::string filename)
read states from trajectory (given as plain text file)
Definition: tools.cpp:58
std::string stringprintf(const std::string &str,...)
printf-version for std::string
Definition: tools.cpp:80
std::pair< std::size_t, std::size_t > min_max_box(const std::vector< NUM > &limits, NUM val, NUM radius)
return indices of min and max boxes around value for given radius.
Definition: tools.hxx:179