ProteoWizard
Connection_mz5.hpp
Go to the documentation of this file.
1 //
2 // $Id: Connection_mz5.hpp 2819 2011-06-27 18:00:40Z chambm $
3 //
4 //
5 // Original authors: Mathias Wilhelm <mw@wilhelmonline.com>
6 // Marc Kirchner <mail@marc-kirchner.de>
7 //
8 // Copyright 2011 Proteomics Center
9 // Children's Hospital Boston, Boston, MA 02135
10 //
11 // Licensed under the Apache License, Version 2.0 (the "License");
12 // you may not use this file except in compliance with the License.
13 // You may obtain a copy of the License at
14 //
15 // http://www.apache.org/licenses/LICENSE-2.0
16 //
17 // Unless required by applicable law or agreed to in writing, software
18 // distributed under the License is distributed on an "AS IS" BASIS,
19 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
20 // See the License for the specific language governing permissions and
21 // limitations under the License.
22 //
23 
24 #ifndef CONNECTION_MZ5_HPP_
25 #define CONNECTION_MZ5_HPP_
26 
27 #include "../MSData.hpp"
28 #include "Configuration_mz5.hpp"
29 #include <string>
30 #include <vector>
31 
32 namespace pwiz {
33 namespace msdata {
34 namespace mz5 {
35 
36 /**
37  * This class is used for reading and writing information to a mz5 file.
38  * On destruction it will automatically close all existing datasets and flush the file.
39  */
41 {
42 public:
43  /**
44  * mz5 file open policy.
45  */
47  {
48  /**
49  * Fails if the file already exists.
50  */
52  /**
53  * If file exists, it will be deleted and created empty.
54  */
56  /**
57  * Open file with read and write support.
58  */
60  /**
61  * Open file with read only support.
62  */
64  };
65 
66  /**
67  * Default constructor.
68  *
69  * When opening a file, which is a hdf5 file but no mz5 file, a runtime_error is thrown.
70  *
71  * @param filename file name
72  * @param op open policy
73  * @param configuration configuration used to determine chunk and buffer sizes
74  */
75  Connection_mz5(const std::string filename, const OpenPolicy op =
76  ReadOnly, const Configuration_mz5 config =
78 
79  /**
80  * Closes all open datasets and flushes file to filesystem.
81  */
83 
84  /**
85  * Creates and write a one dimensional dataset.
86  * @param size size of the dataset
87  * @param data void pointer to the dataset beginning
88  * @param v dataset enumeration value
89  */
90  void createAndWrite1DDataSet(hsize_t size, void* data,
92 
93  /**
94  * Extends data of to a dataset. This method automatically uses an internal buffer to write the data and calls extendsAndWrite1DDataSet()
95  * @param d1 data
96  * @param v dataset enumeration value
97  */
98  void extendData(const std::vector<double>& d1,
100 
101  /**
102  * Returns a list of all existing datasets in this file.
103  */
104  const std::map<Configuration_mz5::MZ5DataSets, size_t>& getFields();
105 
106  /**
107  * Reads a dataset.
108  * If no pointer is set, this method will allocate the needed mememory with calloc. To regain the memory call clean().
109  *
110  * @param v dataset enumeration value
111  * @param dsend dataset size
112  * @param ptr start pointer where the data should be written to.
113  * @return pointer to the data
114  */
115  void* readDataSet(Configuration_mz5::MZ5DataSets v, size_t& dsend,
116  void* ptr = 0);
117 
118  /**
119  * Clean up of open datasets and destruction of corresponding data elements.
120  * This method calls vlenReclaim, free and close.
121  * @param v dataset enumeration value
122  * @param data pointer to the beginning of the data
123  * @param dsend length of the data.
124  */
125  void clean(const Configuration_mz5::MZ5DataSets v, void* data,
126  const size_t dsend);
127 
128  /**
129  * Gets data from a numerical dataset and writes it to the vector. This method is used to get mz,intensity and time.
130  * @param data data vector
131  * @param v dataset enumeration value
132  * @param start start index
133  * @param end end index
134  */
135  void getData(std::vector<double>& data,
136  const Configuration_mz5::MZ5DataSets v, const hsize_t start,
137  const hsize_t end);
138 
139  /**
140  * Getter.
141  * @return current configuration
142  */
144 
145 private:
146 
147  /**
148  * Creates a DSetCreatPropList for a dataset.
149  * @param rank dimensionality of dataset
150  * @param dataset dataset used to determine the name
151  * @param datadim data dimensions
152  * @return DSetCreatPropList
153  */
154  H5::DSetCreatPropList getCParm(int rank,
155  const Configuration_mz5::MZ5DataSets& v, const hsize_t& datadim);
156 
157  /**
158  * Creates a dataset.
159  * @param rank dimensionality of the dataset
160  * @param dim size of each dimension
161  * @param maxdim maximal size of each dimension
162  * @param v dataset enumeration value
163  * @return dataset
164  */
165  H5::DataSet getDataSet(int rank, hsize_t* dim, hsize_t* maxdim,
167 
168  /**
169  * Initializes a file and read internal mz5 information.
170  *
171  * Will throw a runtime_error when the file is not a mz5 file.
172  */
173  void readFile();
174 
175  /**
176  * Extends and appends data to an existing dataset with no buffer.
177  * @param dataset dataset
178  * @param d1 data
179  */
180  void extendAndWrite1DDataSet(const H5::DataSet& dataset, const std::vector<
181  double>& d1);
182 
183  /**
184  * Internal method to add data to a buffer.
185  * @param b buffer
186  * @param d1 data
187  * @param bs buffer size
188  * @param dataset dataset
189  */
190  void addToBuffer(std::vector<double>& b, const std::vector<double>& d1,
191  const size_t bs, const H5::DataSet& dataset);
192 
193  /**
194  * Flushes all data to the hard drive.
195  * @param v dataset enumeration value
196  */
198 
199  /**
200  * Closes the file and flushes all open buffers/datasets.
201  */
202  void close();
203 
204  /**
205  * Existing field in file.
206  */
207  std::map<Configuration_mz5::MZ5DataSets, size_t> fields_;
208  /**
209  * MZ5 file reference.
210  */
211  H5::H5File* file_;
212  /**
213  * mz5 configuration object.
214  */
216  /**
217  * Mapping from a dataset enumeration value to the dataset.
218  */
219  std::map<Configuration_mz5::MZ5DataSets, H5::DataSet> bufferMap_;
220  /**
221  * Mapping from a dataset enumeration value to a buffer.
222  */
223  std::map<Configuration_mz5::MZ5DataSets, std::vector<double> > buffers_;
224  /**
225  * Flag whether file is closed or not.
226  */
227  bool closed_;
228 };
229 
230 }
231 }
232 }
233 
234 #endif /* CONNECTION_MZ5_HPP_ */