guts
gutilities.cc
Go to the documentation of this file.
1 // gutilities
2 #include "gutilities.h"
3 
4 // Numbers / strings with units / io interface to CLHEP units
5 #include "CLHEP/Units/PhysicalConstants.h"
6 
7 // c++
8 // algorithm for 'transform'
9 #include <algorithm>
10 #include <sstream>
11 #include <unordered_map>
12 #include <iostream>
13 #include <fstream>
14 #include <vector>
15 
16 using namespace std;
17 
18 namespace gutilities {
19 
20  string removeLeadingAndTrailingSpacesFromString(const std::string &input) {
21  size_t startPos = input.find_first_not_of(" \t"); // Find the first non-whitespace character
22  size_t endPos = input.find_last_not_of(" \t"); // Find the last non-whitespace character
23 
24  // If all spaces or empty, return an empty string
25  if (startPos == std::string::npos || endPos == std::string::npos) {
26  return "";
27  }
28 
29  // Return the substring between startPos and endPos
30  return input.substr(startPos, endPos - startPos + 1);
31  }
32 
33  string removeAllSpacesFromString(const std::string &str) {
34  string result = str;
35  result.erase(std::remove(result.begin(), result.end(), ' '), result.end());
36  return result;
37  }
38 
39  string getFileFromPath(const std::string &path) {
40  std::size_t lastSlashPos = path.find_last_of('/');
41  if (lastSlashPos == std::string::npos) {
42  // No slashes found, return the entire path
43  return path;
44  }
45  return path.substr(lastSlashPos + 1);
46  }
47 
48  string getDirFromPath(const std::string &path) {
49  auto lastSlash = path.find_last_of('/');
50  if (lastSlash == std::string::npos) return ".";
51  return path.substr(0, lastSlash);
52  }
53 
54  vector <std::string> getStringVectorFromString(const std::string &input) {
55  std::vector <std::string> pvalues;
56  stringstream plist(input);
57  string tmp;
58  while (plist >> tmp) {
59  string trimmed = removeLeadingAndTrailingSpacesFromString(tmp);
60  if (!trimmed.empty()) {
61  pvalues.push_back(trimmed);
62  }
63  }
64  return pvalues;
65  }
66 
67  // Replace all occurences of specific chars in a string with a string
68  string replaceCharInStringWithChars(const std::string &input, const std::string &toReplace, const std::string &replacement) {
69  string output;
70  for (const char &ch: input) {
71  if (toReplace.find(ch) != std::string::npos) {
72  output.append(replacement);
73  } else {
74  output.push_back(ch);
75  }
76  }
77  return output;
78  }
79 
80  string replaceAllStringsWithString(const string &source, const string &from, const string &to) {
81  if (from.empty()) return source; // Avoid infinite loop
82 
83  string newString;
84  size_t lastPos = 0;
85  size_t findPos = source.find(from, lastPos);
86 
87  while (findPos != string::npos) {
88  // Append part before the match and the replacement string
89  newString.append(source, lastPos, findPos - lastPos);
90  newString += to;
91  lastPos = findPos + from.length();
92  findPos = source.find(from, lastPos);
93  }
94 
95  // Append the remaining part of the string after the last occurrence
96  newString += source.substr(lastPos);
97 
98  return newString;
99  }
100 
101 
102  string fillDigits(const string &word, const string &c, int ndigits) {
103  if (c.empty() || ndigits <= static_cast<int>(word.size())) return word; // Return original if no padding needed
104 
105  string filled;
106 
107  int toFill = ndigits - static_cast<int>(word.size());
108  filled.reserve(ndigits);
109 
110  filled.append(toFill, c[0]); // Use the first character of the string 'c'
111  filled += word;
112 
113  return filled;
114  }
115 
116 
117  double getG4Number(const string &v, bool warnIfNotUnit) {
119 
120  // If no '*' is found, the input is assumed to be a number without units
121  if (value.find('*') == string::npos) {
122  if (!value.empty() && warnIfNotUnit && stod(value) != 0) {
123  cerr << " ! Warning: value " << v << " does not contain units." << endl;
124  }
125 
126  try {
127  return stod(value);
128  } catch (const exception &e) {
129  cerr << FATALERRORL << "stod exception in gutilities: could not convert string to double. "
130  << "Value: >" << v << "<, error: " << e.what() << endl;
131  exit(EC__G4NUMBERERROR);
132  }
133  } else {
134  // Split the input string into the numeric part and the unit part
135  size_t pos = value.find('*');
136  string rootValue = value.substr(0, pos);
137  string units = value.substr(pos + 1);
138 
139  double answer = 0;
140  try {
141  answer = stod(rootValue);
142  } catch (const exception &e) {
143  cerr << FATALERRORL << "stod exception in gutilities: could not convert string to double. "
144  << "Value: >" << v << "<, error: " << e.what() << endl;
145  exit(EC__G4NUMBERERROR);
146  }
147 
148  // Map of unit conversions for easier lookup and maintenance
149  static const unordered_map<string, double> unitConversion = {
150  {"m", CLHEP::m},
151  {"cm", CLHEP::cm},
152  {"mm", CLHEP::mm},
153  {"um", 1E-6 * CLHEP::m},
154  {"fm", 1E-15 * CLHEP::m},
155  {"inches", 2.54 * CLHEP::cm},
156  {"inch", 2.54 * CLHEP::cm},
157  {"deg", CLHEP::deg},
158  {"degrees", CLHEP::deg},
159  {"arcmin", CLHEP::deg / 60.0},
160  {"rad", CLHEP::rad},
161  {"mrad", CLHEP::mrad},
162  {"eV", CLHEP::eV},
163  {"MeV", CLHEP::MeV},
164  {"KeV", 0.001 * CLHEP::MeV},
165  {"GeV", CLHEP::GeV},
166  {"T", CLHEP::tesla},
167  {"T/m", CLHEP::tesla / CLHEP::m},
168  {"Tesla", CLHEP::tesla},
169  {"gauss", CLHEP::gauss},
170  {"kilogauss", CLHEP::gauss * 1000},
171  {"s", CLHEP::s},
172  {"ns", CLHEP::ns},
173  {"ms", CLHEP::ms},
174  {"us", CLHEP::us},
175  {"counts", 1}
176  };
177 
178  auto it = unitConversion.find(units);
179  if (it != unitConversion.end()) {
180  answer *= it->second;
181  } else {
182  cerr << GWARNING << ">" << units << "<: unit not recognized for string <" << v << ">" << endl;
183  }
184 
185  return answer;
186  }
187 
188  return 0.0; // Default return in case of unexpected flow
189  }
190 
191  double getG4Number(double input, const string &unit) {
192  string gnumber = to_string(input) + "*" + unit;
193  return getG4Number(gnumber, true);
194  }
195 
196  vector<double> getG4NumbersFromStringVector(const vector <string> &vstring, bool warnIfNotUnit) {
197  vector<double> output;
198  output.reserve(vstring.size());
199 
200  for (const auto &s: vstring) {
201  output.push_back(getG4Number(s, warnIfNotUnit));
202  }
203 
204  return output;
205  }
206 
207  vector<double> getG4NumbersFromString(const string &vstring, bool warnIfNotUnit) {
208  return getG4NumbersFromStringVector(getStringVectorFromStringWithDelimiter(vstring, ","), warnIfNotUnit);
209  }
210 
211 
212  string parseFileAndRemoveComments(const string &filename, const string &commentChars, int verbosity) {
213  // Reading file
214  ifstream in(filename);
215  if (!in) {
216  cerr << FATALERRORL << "can't open input file " << filename << ". Check your spelling. " << endl;
217  exit(EC__FILENOTFOUND);
218  }
219 
220  stringstream strStream;
221  if (verbosity > 0) {
222  cout << endl << CIRCLEITEM << " Loading string from " << filename << endl;
223  }
224  strStream << in.rdbuf(); // Read the file
225  in.close();
226 
227  string parsedString = strStream.str();
228 
229  // Removing all occurrences of commentChars
230  size_t nFPos;
231  while ((nFPos = parsedString.find(commentChars)) != string::npos) {
232  size_t firstNL = parsedString.rfind('\n', nFPos);
233  size_t secondNL = parsedString.find('\n', nFPos);
234  parsedString.erase(firstNL, secondNL - firstNL);
235  }
236 
237  return parsedString;
238  }
239 
240  string retrieveStringBetweenChars(const string &input, const string &firstDelimiter, const string &secondDelimiter) {
241  size_t firstpos = input.find(firstDelimiter);
242  size_t secondpos = input.find(secondDelimiter);
243 
244  if (firstpos == string::npos || secondpos == string::npos) {
245  return "";
246  }
247  return input.substr(firstpos + firstDelimiter.length(), secondpos - firstpos - firstDelimiter.length());
248  }
249 
250  vector <string> getStringVectorFromStringWithDelimiter(const string &input, const string &x) {
251  vector <string> pvalues;
252  string tmp;
253 
254  for (char ch: input) {
255  if (ch != x[0]) {
256  tmp += ch;
257  } else {
258  if (!tmp.empty()) {
259  pvalues.push_back(removeLeadingAndTrailingSpacesFromString(tmp));
260  tmp.clear();
261  }
262  }
263  }
264 
265  if (!tmp.empty()) {
266  pvalues.push_back(removeLeadingAndTrailingSpacesFromString(tmp));
267  }
268 
269  return pvalues;
270  }
271 
272 
273 // string search for a path with <name> from a possible list of absolute paths
274 // returns UNINITIALIZEDSTRINGQUANTITY if not found
275 // the filesystem solution does not work on linux systems.
276 // TODO: periodically try this?
277 //#include <filesystem>
278 //
279 // string searchForDirInLocations(string dirName, vector <string> possibleLocations) {
280 //
281 // for (auto trialLocation: possibleLocations) {
282 // string possibleDir = trialLocation + "/" + dirName;
283 // if (std::filesystem::exists(possibleDir)) {
284 // return possibleDir;
285 // }
286 // }
287 // return UNINITIALIZEDSTRINGQUANTITY;
288 // }
289 //
290 // vector <string> getListOfFilesInDirectory(string dirName, vector <string> extensions) {
291 //
292 // vector <string> fileList;
293 //
294 // for (const auto &entry: std::filesystem::directory_iterator(dirName)) {
295 // for (auto &extension: extensions) {
296 // if (entry.path().extension() == extension) {
297 // fileList.push_back(entry.path().filename());
298 // }
299 // }
300 // }
301 //
302 // return fileList;
303 // }
304 // end of TODO
305 
306 #include <dirent.h>
307 #include <sys/stat.h>
308 
309  bool directoryExists(const std::string &path) {
310  struct stat info;
311  if (stat(path.c_str(), &info) != 0) {
312  return false; // Path does not exist
313  }
314  return (info.st_mode & S_IFDIR) != 0; // Check if it's a directory
315  }
316 
317  string searchForDirInLocations(const string &dirName, const vector <string> &possibleLocations) {
318  for (const auto &trialLocation: possibleLocations) {
319  string possibleDir = trialLocation + "/" + dirName;
320  if (directoryExists(possibleDir)) {
321  return possibleDir;
322  }
323  }
324  return "UNINITIALIZEDSTRINGQUANTITY";
325  }
326 
327 
328  bool hasExtension(const std::string &filename, const std::vector <std::string> &extensions) {
329  for (const auto &ext: extensions) {
330  if (filename.size() >= ext.size() &&
331  filename.compare(filename.size() - ext.size(), ext.size(), ext) == 0) {
332  return true;
333  }
334  }
335  return false;
336  }
337 
338  vector <string> getListOfFilesInDirectory(const string &dirName, const vector <string> &extensions) {
339  vector <string> fileList;
340 
341  DIR *dir = opendir(dirName.c_str());
342  if (dir) {
343  struct dirent *entry;
344  while ((entry = readdir(dir)) != nullptr) {
345  struct stat info;
346  string filepath = dirName + "/" + entry->d_name;
347  if (stat(filepath.c_str(), &info) == 0 && S_ISREG(info.st_mode)) {
348  string filename = entry->d_name;
349  if (hasExtension(filename, extensions)) {
350  fileList.push_back(filename);
351  }
352  }
353  }
354  closedir(dir);
355  }
356 
357  return fileList;
358  }
359 
360  string convertToLowercase(const string &str) {
361  string lower = str;
362  transform(lower.begin(), lower.end(), lower.begin(), ::tolower);
363  return lower;
364  }
365 
366 
367  template<class KEY, class VALUE>
368  vector<KEY> getKeys(const map<KEY, VALUE>& map) {
369  vector<KEY> keys;
370  keys.reserve(map.size()); // Reserve space for efficiency
371 
372  for (const auto& it : map) {
373  keys.push_back(it.first);
374  }
375 
376  return keys;
377  }
378 
379  randomModel stringToRandomModel(const std::string &str) {
380  static const std::unordered_map <std::string, randomModel> strToEnum = {
381  {"uniform", uniform},
382  {"gaussian", gaussian},
383  {"cosine", cosine},
384  {"sphere", sphere}
385  };
386 
387  auto it = strToEnum.find(str);
388  if (it != strToEnum.end()) {
389  return it->second;
390  } else {
391  throw std::invalid_argument("Invalid string for randomModel: " + str);
392  }
393  }
394 
395 
396 }
#define GWARNING
Warning label.
#define EC__FILENOTFOUND
File not found error code.
#define CIRCLEITEM
Symbol for circle item.
#define EC__G4NUMBERERROR
G4 number error code.
#define FATALERRORL
Fatal error label.
string replaceAllStringsWithString(const string &source, const string &from, const string &to)
Replaces all occurrences of a substring with another string.
Definition: gutilities.cc:80
bool hasExtension(const std::string &filename, const std::vector< std::string > &extensions)
Checks if a filename has one of the specified extensions.
Definition: gutilities.cc:328
vector< double > getG4NumbersFromString(const string &vstring, bool warnIfNotUnit)
Converts a comma-separated string of numbers with units to a vector of doubles.
Definition: gutilities.cc:207
string removeAllSpacesFromString(const std::string &str)
Removes all spaces from a string.
Definition: gutilities.cc:33
vector< string > getStringVectorFromStringWithDelimiter(const string &input, const string &x)
Splits a string into a vector of substrings using a specified delimiter.
Definition: gutilities.cc:250
randomModel stringToRandomModel(const std::string &str)
Converts a string to a corresponding randomModel enum value.
Definition: gutilities.cc:379
vector< string > getListOfFilesInDirectory(const string &dirName, const vector< string > &extensions)
Retrieves a list of files with specific extensions from a directory.
Definition: gutilities.cc:338
vector< double > getG4NumbersFromStringVector(const vector< string > &vstring, bool warnIfNotUnit)
Converts a vector of strings representing numbers with units to a vector of doubles.
Definition: gutilities.cc:196
string retrieveStringBetweenChars(const string &input, const string &firstDelimiter, const string &secondDelimiter)
Retrieves a substring between two specified delimiters in a string.
Definition: gutilities.cc:240
string replaceCharInStringWithChars(const std::string &input, const std::string &toReplace, const std::string &replacement)
Replaces all occurrences of specified characters in a string with another string.
Definition: gutilities.cc:68
string fillDigits(const string &word, const string &c, int ndigits)
Pads a string with a specified character until it reaches a desired length.
Definition: gutilities.cc:102
randomModel
Enumeration of random models.
Definition: gutilities.h:275
@ gaussian
Gaussian distribution.
Definition: gutilities.h:277
@ uniform
Uniform distribution.
Definition: gutilities.h:276
@ sphere
Sphere distribution.
Definition: gutilities.h:279
@ cosine
Cosine distribution.
Definition: gutilities.h:278
string getDirFromPath(const std::string &path)
Extracts the directory path from a given file path.
Definition: gutilities.cc:48
string convertToLowercase(const string &str)
Converts a string to lowercase.
Definition: gutilities.cc:360
bool directoryExists(const std::string &path)
Checks if a directory exists at the given path.
Definition: gutilities.cc:309
vector< KEY > getKeys(const map< KEY, VALUE > &map)
Retrieves all keys from a map.
Definition: gutilities.cc:368
string removeLeadingAndTrailingSpacesFromString(const std::string &input)
Removes leading and trailing spaces and tabs from a string.
Definition: gutilities.cc:20
string searchForDirInLocations(const string &dirName, const vector< string > &possibleLocations)
Searches for a directory within a list of possible locations.
Definition: gutilities.cc:317
string parseFileAndRemoveComments(const string &filename, const string &commentChars, int verbosity)
Parses a file and removes all lines containing specified comment characters.
Definition: gutilities.cc:212
string getFileFromPath(const std::string &path)
Extracts the filename from a given file path.
Definition: gutilities.cc:39
vector< std::string > getStringVectorFromString(const std::string &input)
Splits a string into a vector of strings using spaces as delimiters.
Definition: gutilities.cc:54
double getG4Number(double input, const string &unit)
Converts a numeric value with a unit into a G4 number format and returns the converted value.
Definition: gutilities.cc:191