|
YODA - Yet more Objects for Data Analysis 2.1.0
|
Go to the documentation of this file.
6#ifndef YODA_READERUTILS_H
7#define YODA_READERUTILS_H
21#include <YODA/highfive/H5File.hpp>
23#include <highfive/H5File.hpp>
24#define YODA_H5 HighFive
47 static const std::regex regex_string_pat( "([\"\'])(?:(?=(\\\\?))\\2.)*?\\1");
55 class aistringstream {
58 aistringstream( const char* line=0) {
63 aistringstream( const string& line) {
71 bool peek( const std::string& s) const {
72 return s == std::string(_next, s.size());
76 void reset( const char* line=0) {
77 _next = const_cast<char* >(line);
82 void reset( const string& line) { reset(line.c_str()); }
86 aistringstream& operator >> (T& value) {
88 if (_new_next == _next) _error = true;
94 operator bool() const { return !_error; }
101 _locale_set = newlocale(LC_NUMERIC_MASK, "C", NULL);
102 _locale_prev = uselocale(_locale_set);
104 throw ReadError(std::string( "Error setting locale: ") + strerror(errno));
107 void _reset_locale() {
108 if (!uselocale(_locale_prev)) {
109 throw ReadError(std::string( "Error setting locale: ") + strerror(errno));
111 freelocale(_locale_set);
114 void _get( double& x) { x = std::strtod(_next, &_new_next); }
115 void _get( float& x) { x = std::strtof(_next, &_new_next); }
116 void _get( int& i) { i = std::strtol(_next, &_new_next, 10); }
117 void _get( long& i) { i = std::strtol(_next, &_new_next, 10); }
118 void _get( unsigned int& i) { i = std::strtoul(_next, &_new_next, 10); }
119 void _get( long unsigned int& i) { i = std::strtoul(_next, &_new_next, 10); }
120 void _get( string& x) {
121 while (std::isspace(*_next) && _next[0] != '\0') _next += 1;
123 while (!std::isspace(*_new_next) && _new_next[0] != '\0') _new_next += 1;
124 x = string(_next, _new_next-_next);
127 locale_t _locale_set, _locale_prev;
128 char *_next, *_new_next;
141 virtual void parse( const string& line) = 0;
157 if constexpr (std::is_same<T, std::string>::value) {
158 string::const_iterator initpos( line.cbegin() );
159 const string::const_iterator finpos( line.cend() );
161 while ( std::regex_search(initpos, finpos, m, regex_string_pat) ) {
163 std::stringstream ss(m[0].str());
164 ss >> std::quoted(label);
165 vec.push_back(label);
166 initpos = m.suffix().first;
170 std::string content = line.substr(line.find( ": [")+3);
172 for ( const std::string& item : Utils::split(content, ",")) {
176 vec.push_back(std::move(tmp));
202 double sumw(0), sumw2(0), n(0);
203 aiss >> sumw >> sumw2 >> n;
204 dbn = Dbn0D(n, sumw, sumw2);
218 auto* ao = new Counter(h5file. path(), annos.back());
220 ao->deserializeMeta(annos);
233 vector<string> sources;
235 void readErrors(std::map< string,std::pair<double,double>>& errors) {
237 for ( size_t i = 0; i < sources.size(); ++i) {
239 if (eDn != "---" && eUp != "---") {
240 errors[sources[i]] = { Utils::toDbl(eDn), Utils::toDbl(eUp) };
248 if (!line.rfind( "ErrorLabels: ", 0)) {
249 extractVector<std::string>(line, sources);
256 std::map<string,std::pair<double,double>> errors;
274 ao->deserializeMeta(annos);
292 vector<PointND<N>> points;
295 void readCoords(vector<double>& vals, vector<double>& errm, vector<double>& errp) {
296 if constexpr(I < N) {
297 double v(0), em(0), ep(0);
298 aiss >> v >> em >> ep;
302 readCoords<I+1>(vals, errm, errp);
310 vector<double> vals(N), errm(N), errp(N);
311 readCoords<0>(vals, errm, errp);
312 points.push_back( PointND<N>(vals, errm, errp));
318 ao->addPoints(points);
329 ao->deserializeMeta(annos);
338 template < size_t DbnN, typename... AxisT>
344 using is_CAxis = typename std::is_floating_point< typename std::tuple_element_t<I, std::tuple<AxisT...>>>;
346 std::tuple<vector<AxisT> ...> edges;
348 vector<Dbn<DbnN>> dbns;
349 vector<size_t> maskedBins;
350 std::array<double,DbnN*(DbnN-1)/2> crossTerms;
351 bool isYODA1 = false;
352 size_t axisCheck = 0;
357 if constexpr(I < sizeof...(AxisT)) {
358 using EdgeT = std::tuple_element_t<I, std::tuple<AxisT...>>;
359 if constexpr (is_CAxis<I>::value) {
362 auto& curr_edges = std::get<I>(edges);
363 if (!std::isinf(lo)) {
364 if (curr_edges.empty()) curr_edges.push_back(lo);
366 if (!std::isinf(hi)) {
367 if (curr_edges.size() && curr_edges[ curr_edges.size() - 1 ] != hi) {
368 curr_edges.push_back(hi);
373 throw BinningError( "Discrete axes are not supported in this YODA1-style legacy format.");
380 void readEdges( const std::string& line) {
381 if constexpr(I < sizeof...(AxisT)) {
382 if (I == axisCheck) {
383 using EdgeT = std::tuple_element_t<I, std::tuple<AxisT...>>;
384 auto& curr_edges = std::get<I>(edges);
385 extractVector<EdgeT>(line, curr_edges);
387 readEdges<I+1>(line);
395 if constexpr(I < sizeof...(AxisT)) {
396 using EdgeT = std::tuple_element_t<I, std::tuple<AxisT...>>;
397 auto& curr_edges = std::get<I>(edges);
399 loadEdges<I+1>(h5file);
405 if constexpr(I < sizeof...(AxisT)) {
406 using EdgeT = std::tuple_element_t<I, std::tuple<AxisT...>>;
408 skipEdges<I+1>(h5file);
415 void readDbn(std::array<double,DbnN+1>& sumW, std::array<double,DbnN+1>& sumW2) {
416 if constexpr(I <= DbnN) {
421 readDbn<I+1>(sumW, sumW2);
425 template < class tupleT, size_t... Is>
426 BaseT* make_from_tuple(tupleT&& tuple, std::index_sequence<Is...> ) {
427 BaseT* rtn = new BaseT{std::get<Is>(std::forward<tupleT>(tuple))...};
428 rtn->maskBins(maskedBins);
432 template < class tupleT>
433 BaseT* make_from_tuple(tupleT&& tuple) {
434 return make_from_tuple(std::forward<tupleT>(tuple),
435 std::make_index_sequence< sizeof...(AxisT)+1>{});
440 if constexpr(I < sizeof...(AxisT)) {
441 std::get<I>(edges).clear();
449 if (line.find( "Total") != string::npos) {
453 if (!line.rfind( "Edges(A", 0)) {
458 if (!line.rfind( "MaskedBins: ", 0)) {
459 extractVector<size_t>(line, maskedBins);
463 if (line.find( "Underflow") != string::npos || line.find( "Overflow") != string::npos) {
465 if constexpr ( sizeof...(AxisT) == 1) {
467 aiss >> tmp1 >> tmp2;
470 else if (isYODA1) readEdges<0>();
471 std::array<double,DbnN+1> sumW, sumW2;
472 readDbn<0>(sumW, sumW2);
473 for ( size_t i = 0; i < crossTerms.size(); ++i) {
476 crossTerms.at(i) = tmp;
478 double numEntries(0);
480 if (line.find( "Overflow") != string::npos) {
481 if constexpr ( sizeof...(AxisT) == 1) {
482 if constexpr (DbnN < 2)
483 yoda1Overflow = Dbn<DbnN>(numEntries, sumW, sumW2);
485 yoda1Overflow = Dbn<DbnN>(numEntries, sumW, sumW2, crossTerms);
489 if constexpr (DbnN < 2) {
490 dbns.emplace_back(numEntries, sumW, sumW2);
493 dbns.emplace_back(numEntries, sumW, sumW2, crossTerms);
500 auto args = std::tuple_cat(edges, std::make_tuple(path));
501 BaseT* ao = make_from_tuple(std::move(args));
503 size_t global_index = 0;
504 if constexpr ( sizeof...(AxisT) == 2) {
506 for ( size_t ix = 1; ix < ao->numBinsAt(0)+1; ++ix) {
507 for ( size_t iy = 1; iy < ao->numBinsAt(1)+1; ++iy) {
508 ao->bin(ix,iy).set(std::move(dbns[global_index++]));
513 if ( !(isYODA1 && sizeof...(AxisT) == 2) ) {
514 for ( auto&& d : dbns) {
515 ao->bin(global_index++).set(std::move(d));
519 if constexpr ( sizeof...(AxisT) == 1) {
520 if (isYODA1) ao->bin(global_index).set(yoda1Overflow);
536 loadEdges<0>(h5file);
539 auto args = std::tuple_cat(edges, std::make_tuple(h5file. path(), annos.back()));
540 BaseT* ao = make_from_tuple(std::move(args));
542 ao->deserializeMeta(annos);
550 skipEdges<0>(h5file);
560 template < typename... AxisT>
565 std::tuple<vector<AxisT> ...> edges;
566 vector<Estimate> estimates;
567 vector<size_t> maskedBins;
568 vector<string> sources;
569 size_t axisCheck = 0;
573 void readEdges( const std::string& line) {
574 if constexpr(I < sizeof...(AxisT)) {
575 if (I == axisCheck) {
576 using EdgeT = std::tuple_element_t<I, std::tuple<AxisT...>>;
577 auto& curr_edges = std::get<I>(edges);
578 extractVector<EdgeT>(line, curr_edges);
580 readEdges<I+1>(line);
584 void readErrors(std::map< string,std::pair<double,double>>& errors) {
586 for ( const std::string& src : sources) {
588 if (eDn != "---" && eUp != "---") {
589 errors[src] = { Utils::toDbl(eDn), Utils::toDbl(eUp) };
598 if constexpr(I < sizeof...(AxisT)) {
599 using EdgeT = std::tuple_element_t<I, std::tuple<AxisT...>>;
600 auto& curr_edges = std::get<I>(edges);
602 loadEdges<I+1>(h5file);
608 if constexpr(I < sizeof...(AxisT)) {
609 using EdgeT = std::tuple_element_t<I, std::tuple<AxisT...>>;
611 skipEdges<I+1>(h5file);
617 template < class tupleT, size_t... Is>
618 BaseT* make_from_tuple(tupleT&& tuple, std::index_sequence<Is...> ) {
619 BaseT* rtn = new BaseT{std::get<Is>(std::forward<tupleT>(tuple))...};
620 rtn->maskBins(maskedBins);
624 template < class tupleT>
625 BaseT* make_from_tuple(tupleT&& tuple) {
626 return make_from_tuple(std::forward<tupleT>(tuple),
627 std::make_index_sequence< sizeof...(AxisT)+1>{});
632 if constexpr(I < sizeof...(AxisT)) {
633 std::get<I>(edges).clear();
641 if (!line.rfind( "Edges(A", 0)) {
646 if (!line.rfind( "MaskedBins: ", 0)) {
647 extractVector<size_t>(line, maskedBins);
650 if (!line.rfind( "ErrorLabels: ", 0)) {
651 extractVector<std::string>(line, sources);
658 std::map<string,std::pair<double,double>> errors;
660 estimates.emplace_back(val, errors);
665 auto args = std::tuple_cat(edges, std::make_tuple(path));
666 BaseT* ao = make_from_tuple(std::move(args));
668 size_t global_index = 0;
669 for ( auto&& e : estimates) {
670 ao->bin(global_index++) = std::move(e);
684 loadEdges<0>(h5file);
688 auto args = std::tuple_cat(edges, std::make_tuple(h5file. path(), annos.back()));
689 BaseT* ao = make_from_tuple(std::move(args));
691 ao->deserializeMeta(annos);
694 for ( auto& b : ao->bins( true, true)) {
704 skipEdges<0>(h5file);
AOReaderBase() Default constructor.
virtual void skip(H5FileManager &h5file)
virtual void parse(const string &line)=0
virtual ~AOReaderBase() Default destructor.
virtual AnalysisObject * assemble(const string &path="")=0
void extractVector(const std::string &line, std::vector< T > &vec)
virtual AnalysisObject * mkFromH5(H5FileManager &)=0
AnalysisObject * mkFromH5(H5FileManager &h5file)
void skip(H5FileManager &h5file)
void parse(const string &line)
AnalysisObject * assemble(const string &path="")
void parse(const string &line)
void skip(H5FileManager &h5file)
AnalysisObject * mkFromH5(H5FileManager &h5file)
AnalysisObject * assemble(const string &path="")
void parse(const string &line)
AnalysisObject * mkFromH5(H5FileManager &h5file)
AnalysisObject * assemble(const string &path="")
AnalysisObject * assemble(const string &path="")
void parse(const string &line)
AnalysisObject * mkFromH5(H5FileManager &h5file)
void skip(H5FileManager &h5file)
AnalysisObject * mkFromH5(H5FileManager &h5file)
void parse(const string &line)
AnalysisObject * assemble(const string &path="")
AnalysisObject is the base class for histograms and scatters.
User-facing BinnedDbn class in arbitrary dimension.
Error for general binning problems.
Partial template specialisation for Dbn0D.
User-facing Dbn class inheriting from DbnBase.
Helper class to extract AO information from a H5 file.
vector< string > loadSources() noexcept Labels of error sources of current AO.
void skipMasks() noexcept Skips next set of masked indices of current AO.
vector< size_t > loadMasks() noexcept Indices of masked bins in current AO.
const string & path() const Path of current AO.
void skipCommon() noexcept Skips next set of annotations and content of current AO.
vector< EdgeT > loadEdges() noexcept Returns next set of edges of type EdgeT.
vector< string > loadAnnotations() noexcept Serialized annotations of current AO.
vector< double > loadContent() noexcept Serialized content of current AO.
void skipSources() noexcept Skips next set of error sources of current AO.
void skipEdges() noexcept Skips next set of edges of type EdgeT.
Error for file reading errors.
A generic data type which is just a collection of n-dim data points with errors.
Anonymous namespace to limit visibility.
Dbn< 0 > Dbn0D User-friendly aliases.
|