common.h 33.2 KB
Newer Older
1
2
3
4
/*!
 * Copyright (c) 2016 Microsoft Corporation. All rights reserved.
 * Licensed under the MIT License. See LICENSE file in the project root for license information.
 */
5
6
#ifndef LIGHTGBM_UTILS_COMMON_H_
#define LIGHTGBM_UTILS_COMMON_H_
Guolin Ke's avatar
Guolin Ke committed
7

8
#include <LightGBM/utils/json11.h>
9
10
11
#include <LightGBM/utils/log.h>
#include <LightGBM/utils/openmp_wrapper.h>

12
#include <limits>
Guolin Ke's avatar
Guolin Ke committed
13
#include <string>
14
#include <algorithm>
15
#include <chrono>
16
#include <cmath>
17
18
#include <cstdint>
#include <cstdio>
Chen Yufei's avatar
Chen Yufei committed
19
#include <cstdlib>
20
#include <cstring>
Guolin Ke's avatar
Guolin Ke committed
21
#include <functional>
22
#include <iomanip>
23
#include <iterator>
24
#include <map>
25
26
#include <memory>
#include <sstream>
Guolin Ke's avatar
Guolin Ke committed
27
#include <type_traits>
28
#include <unordered_map>
29
30
#include <utility>
#include <vector>
Guolin Ke's avatar
Guolin Ke committed
31

32
33
34
35
36
37
#if (!((defined(sun) || defined(__sun)) && (defined(__SVR4) || defined(__svr4__))))
#define FMT_HEADER_ONLY
#include "../../../external_libs/fmt/include/fmt/format.h"
#endif
#include "../../../external_libs/fast_double_parser/include/fast_double_parser.h"

38
39
40
41
42
#ifdef _MSC_VER
#include <intrin.h>
#pragma intrinsic(_BitScanReverse)
#endif

43
#if defined(_MSC_VER)
44
45
46
#include <malloc.h>
#elif MM_MALLOC
#include <mm_malloc.h>
47
48
49
50
51
52
// https://gcc.gnu.org/onlinedocs/cpp/Common-Predefined-Macros.html
// https://www.oreilly.com/library/view/mac-os-x/0596003560/ch05s01s02.html
#elif defined(__GNUC__) && defined(HAVE_MALLOC_H)
  #include <malloc.h>
  #define _mm_malloc(a, b) memalign(b, a)
  #define _mm_free(a) free(a)
53
54
55
56
#else
#include <stdlib.h>
#define _mm_malloc(a, b) malloc(a)
#define _mm_free(a) free(a)
57
58
#endif

Guolin Ke's avatar
Guolin Ke committed
59
60
61
62
namespace LightGBM {

namespace Common {

63
64
using json11::Json;

65
66
67
68
69
70
71
/*!
 * \brief Switch a string stream to the classic "C" locale.
 * \param ss Stream that gets imbued with std::locale::classic()
 */
static void C_stringstream(std::stringstream &ss) {
  const std::locale& c_locale = std::locale::classic();
  ss.imbue(c_locale);
}

72
/*!
 * \brief Lower-case a single character; only 'A'..'Z' are changed.
 * \param in Character to convert
 * \return Lower-case counterpart of in, or in itself when it is not in 'A'..'Z'
 */
inline static char tolower(char in) {
  const bool is_upper = (in >= 'A' && in <= 'Z');
  return is_upper ? static_cast<char>(in - ('Z' - 'z')) : in;
}

78
/*!
 * \brief Strip leading and trailing whitespace (space, \f, \n, \r, \t, \v).
 * \param str Text to trim (taken by value and modified)
 * \return The trimmed text; empty when str holds only whitespace
 */
inline static std::string Trim(std::string str) {
  const char* const blanks = " \f\n\r\t\v";
  if (!str.empty()) {
    // Cut the tail first; npos + 1 wraps to 0 and clears an all-blank string.
    const size_t last_kept = str.find_last_not_of(blanks);
    str.erase(last_kept + 1);
    const size_t first_kept = str.find_first_not_of(blanks);
    str.erase(0, first_kept);
  }
  return str;
}

87
/*!
 * \brief Strip leading and trailing quote characters (' and ") from a string.
 * \param str Text to clean (taken by value and modified)
 * \return The text without surrounding quotes; quotes in the middle are kept
 */
inline static std::string RemoveQuotationSymbol(std::string str) {
  const char* const quotes = "'\"";
  if (!str.empty()) {
    // Cut the tail first; npos + 1 wraps to 0 and clears an all-quote string.
    const size_t last_kept = str.find_last_not_of(quotes);
    str.erase(last_kept + 1);
    const size_t first_kept = str.find_first_not_of(quotes);
    str.erase(0, first_kept);
  }
  return str;
}
Guolin Ke's avatar
Guolin Ke committed
95

Guolin Ke's avatar
Guolin Ke committed
96
97
98
99
100
101
102
/*!
 * \brief Check whether str begins with prefix.
 * \param str Text to inspect
 * \param prefix Expected leading characters; an empty prefix always matches
 * \return true when the first prefix.size() characters of str equal prefix
 */
inline static bool StartsWith(const std::string& str, const std::string& prefix) {
  // compare() clamps the range to str's length, so a prefix longer than str
  // simply fails to match; no temporary substring is allocated.
  return str.compare(0, prefix.size(), prefix) == 0;
}
Guolin Ke's avatar
Guolin Ke committed
103

Guolin Ke's avatar
Guolin Ke committed
104
/*!
 * \brief Split text on a single delimiter character, dropping empty tokens.
 * \param c_str Null-terminated text to split
 * \param delimiter Character that separates tokens
 * \return Non-empty tokens in their original order
 */
inline static std::vector<std::string> Split(const char* c_str, char delimiter) {
  std::vector<std::string> tokens;
  const std::string text(c_str);
  // Jump from the start of one token to the start of the next.
  size_t token_begin = text.find_first_not_of(delimiter);
  while (token_begin != std::string::npos) {
    const size_t token_end = text.find(delimiter, token_begin);
    if (token_end == std::string::npos) {
      tokens.push_back(text.substr(token_begin));
      break;
    }
    tokens.push_back(text.substr(token_begin, token_end - token_begin));
    token_begin = text.find_first_not_of(delimiter, token_end);
  }
  return tokens;
}

126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
/*!
 * \brief Collect the text found between matching bracket characters.
 *
 * A left delimiter (re)starts a group; the next right delimiter closes it.
 * Empty groups and unclosed groups are not returned.
 * \param c_str Null-terminated text to scan
 * \param left_delimiter Character that opens a group
 * \param right_delimiter Character that closes a group
 * \return Contents of each non-empty group, in order
 */
inline static std::vector<std::string> SplitBrackets(const char* c_str, char left_delimiter, char right_delimiter) {
  std::vector<std::string> groups;
  const std::string text(c_str);
  size_t content_begin = 0;
  bool inside = false;
  for (size_t idx = 0; idx < text.length(); ++idx) {
    const char ch = text[idx];
    if (ch == left_delimiter) {
      inside = true;
      content_begin = idx + 1;
    } else if (inside && ch == right_delimiter) {
      if (content_begin < idx) {
        groups.push_back(text.substr(content_begin, idx - content_begin));
      }
      inside = false;
    }
  }
  return groups;
}

Guolin Ke's avatar
Guolin Ke committed
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
/*!
 * \brief Split text into lines on any run of '\n' and '\r', dropping empty lines.
 * \param c_str Null-terminated text to split
 * \return Non-empty lines in their original order, without line endings
 */
inline static std::vector<std::string> SplitLines(const char* c_str) {
  const char* const line_breaks = "\n\r";
  std::vector<std::string> lines;
  const std::string text(c_str);
  size_t line_begin = text.find_first_not_of(line_breaks);
  while (line_begin != std::string::npos) {
    const size_t line_end = text.find_first_of(line_breaks, line_begin);
    if (line_end == std::string::npos) {
      lines.push_back(text.substr(line_begin));
      break;
    }
    lines.push_back(text.substr(line_begin, line_end - line_begin));
    // skip the whole run of line endings before the next line
    line_begin = text.find_first_not_of(line_breaks, line_end);
  }
  return lines;
}

Guolin Ke's avatar
Guolin Ke committed
174
175
176
177
/*!
 * \brief Split text on any character from a delimiter set, dropping empty tokens.
 * \param c_str Null-terminated text to split
 * \param delimiters Null-terminated set of separator characters
 * \return Non-empty tokens in their original order
 */
inline static std::vector<std::string> Split(const char* c_str, const char* delimiters) {
  const std::string text(c_str);
  auto is_delimiter = [delimiters](char ch) {
    for (const char* d = delimiters; *d != '\0'; ++d) {
      if (*d == ch) {
        return true;
      }
    }
    return false;
  };
  std::vector<std::string> tokens;
  const size_t len = text.length();
  size_t token_begin = 0;
  for (size_t idx = 0; idx < len; ++idx) {
    if (!is_delimiter(text[idx])) {
      continue;
    }
    if (token_begin < idx) {
      tokens.push_back(text.substr(token_begin, idx - token_begin));
    }
    token_begin = idx + 1;
  }
  // trailing token without a closing delimiter
  if (token_begin < len) {
    tokens.push_back(text.substr(token_begin));
  }
  return tokens;
}

203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
inline static std::string GetFromParserConfig(std::string config_str, std::string key) {
  // parser config should follow json format.
  std::string err;
  Json config_json = Json::parse(config_str, &err);
  if (!err.empty()) {
    Log::Fatal("Invalid parser config: %s. Please check if follow json format.", err.c_str());
  }
  return config_json[key].string_value();
}

inline static std::string SaveToParserConfig(std::string config_str, std::string key, std::string value) {
  std::string err;
  Json config_json = Json::parse(config_str, &err);
  if (!err.empty()) {
    Log::Fatal("Invalid parser config: %s. Please check if follow json format.", err.c_str());
  }
  CHECK(config_json.is_object());
  std::map<std::string, Json> config_map = config_json.object_items();
  config_map.insert(std::pair<std::string, Json>(key, Json(value)));
  return Json(config_map).dump();
}

225
226
227
228
/*!
 * \brief Parse a decimal integer; spaces around it and a leading sign are accepted.
 * \param p Null-terminated input text
 * \param out Receives the parsed value (0 when no digit is found)
 * \return Pointer to the first character after the number and trailing spaces
 */
template<typename T>
inline static const char* Atoi(const char* p, T* out) {
  while (*p == ' ') {
    ++p;
  }
  int sign = 1;
  if (*p == '-' || *p == '+') {
    if (*p == '-') {
      sign = -1;
    }
    ++p;
  }
  T value = 0;
  while (*p >= '0' && *p <= '9') {
    value = value * 10 + (*p - '0');
    ++p;
  }
  *out = static_cast<T>(sign * value);
  while (*p == ' ') {
    ++p;
  }
  return p;
}

249
/*!
 * \brief Raise base to an integer power by repeated squaring and cubing.
 * \param base Value to raise; products are formed in type T
 * \param power Integer exponent; negative values return the reciprocal
 * \return base to the given power as a double
 */
template<typename T>
inline static double Pow(T base, int power) {
  if (power < 0) {
    return 1.0 / Pow(base, -power);
  }
  if (power == 0) {
    return 1;
  }
  if (power % 2 == 0) {
    return Pow(base*base, power / 2);
  }
  if (power % 3 == 0) {
    return Pow(base*base*base, power / 3);
  }
  return base * Pow(base, power - 1);
}

264
inline static const char* Atof(const char* p, double* out) {
Guolin Ke's avatar
Guolin Ke committed
265
  int frac;
266
  double sign, value, scale;
Guolin Ke's avatar
Guolin Ke committed
267
  *out = NAN;
Guolin Ke's avatar
Guolin Ke committed
268
269
270
271
272
  // Skip leading white space, if any.
  while (*p == ' ') {
    ++p;
  }
  // Get sign, if any.
273
  sign = 1.0;
Guolin Ke's avatar
Guolin Ke committed
274
  if (*p == '-') {
275
    sign = -1.0;
Guolin Ke's avatar
Guolin Ke committed
276
    ++p;
277
  } else if (*p == '+') {
Guolin Ke's avatar
Guolin Ke committed
278
279
280
    ++p;
  }

Guolin Ke's avatar
Guolin Ke committed
281
282
283
  // is a number
  if ((*p >= '0' && *p <= '9') || *p == '.' || *p == 'e' || *p == 'E') {
    // Get digits before decimal point or exponent, if any.
284
285
    for (value = 0.0; *p >= '0' && *p <= '9'; ++p) {
      value = value * 10.0 + (*p - '0');
Guolin Ke's avatar
Guolin Ke committed
286
    }
Guolin Ke's avatar
Guolin Ke committed
287

Guolin Ke's avatar
Guolin Ke committed
288
289
    // Get digits after decimal point, if any.
    if (*p == '.') {
290
291
      double right = 0.0;
      int nn = 0;
Guolin Ke's avatar
Guolin Ke committed
292
      ++p;
Guolin Ke's avatar
Guolin Ke committed
293
      while (*p >= '0' && *p <= '9') {
294
295
        right = (*p - '0') + right * 10.0;
        ++nn;
Guolin Ke's avatar
Guolin Ke committed
296
297
        ++p;
      }
298
      value += right / Pow(10.0, nn);
Guolin Ke's avatar
Guolin Ke committed
299
300
    }

Guolin Ke's avatar
Guolin Ke committed
301
302
    // Handle exponent, if any.
    frac = 0;
303
    scale = 1.0;
Guolin Ke's avatar
Guolin Ke committed
304
    if ((*p == 'e') || (*p == 'E')) {
Guolin Ke's avatar
Guolin Ke committed
305
      uint32_t expon;
Guolin Ke's avatar
Guolin Ke committed
306
      // Get sign of exponent, if any.
Guolin Ke's avatar
Guolin Ke committed
307
      ++p;
Guolin Ke's avatar
Guolin Ke committed
308
309
310
311
312
313
314
315
316
317
      if (*p == '-') {
        frac = 1;
        ++p;
      } else if (*p == '+') {
        ++p;
      }
      // Get digits of exponent, if any.
      for (expon = 0; *p >= '0' && *p <= '9'; ++p) {
        expon = expon * 10 + (*p - '0');
      }
318
319
320
      if (expon > 308) expon = 308;
      // Calculate scaling factor.
      while (expon >= 50) { scale *= 1E50; expon -= 50; }
Guolin Ke's avatar
Guolin Ke committed
321
      while (expon >= 8) { scale *= 1E8;  expon -= 8; }
322
      while (expon > 0) { scale *= 10.0; expon -= 1; }
Guolin Ke's avatar
Guolin Ke committed
323
    }
Guolin Ke's avatar
Guolin Ke committed
324
325
326
    // Return signed and scaled floating point result.
    *out = sign * (frac ? (value / scale) : (value * scale));
  } else {
327
    size_t cnt = 0;
328
    while (*(p + cnt) != '\0' && *(p + cnt) != ' '
329
330
331
           && *(p + cnt) != '\t' && *(p + cnt) != ','
           && *(p + cnt) != '\n' && *(p + cnt) != '\r'
           && *(p + cnt) != ':') {
332
333
      ++cnt;
    }
334
    if (cnt > 0) {
Guolin Ke's avatar
Guolin Ke committed
335
      std::string tmp_str(p, cnt);
Guolin Ke's avatar
Guolin Ke committed
336
      std::transform(tmp_str.begin(), tmp_str.end(), tmp_str.begin(), Common::tolower);
zhangjin's avatar
zhangjin committed
337
338
      if (tmp_str == std::string("na") || tmp_str == std::string("nan") ||
          tmp_str == std::string("null")) {
Guolin Ke's avatar
Guolin Ke committed
339
        *out = NAN;
340
      } else if (tmp_str == std::string("inf") || tmp_str == std::string("infinity")) {
341
        *out = sign * 1e308;
342
      } else {
343
        Log::Fatal("Unknown token %s in data file", tmp_str.c_str());
Guolin Ke's avatar
Guolin Ke committed
344
345
      }
      p += cnt;
346
    }
Guolin Ke's avatar
Guolin Ke committed
347
  }
Guolin Ke's avatar
Guolin Ke committed
348

Guolin Ke's avatar
Guolin Ke committed
349
350
351
  while (*p == ' ') {
    ++p;
  }
Guolin Ke's avatar
Guolin Ke committed
352

Guolin Ke's avatar
Guolin Ke committed
353
354
355
  return p;
}

Chen Yufei's avatar
Chen Yufei committed
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
/*!
 * \brief Parse a double with fast_double_parser, falling back to strtod.
 *
 * The fallback is taken when fast_double_parser::parse_number returns nullptr.
 * A fallback that converts nothing is reported through Log::Fatal; a range
 * error (ERANGE) only produces a warning.
 * \param p Null-terminated input text
 * \param out Receives the parsed value
 * \return Pointer just past the parsed number
 */
inline static const char* AtofPrecise(const char* p, double* out) {
  const char* fast_end = fast_double_parser::parse_number(p, out);
  if (fast_end == nullptr) {
    // Rare path: Not in RFC 7159 format. Possible "inf", "nan", etc. Fallback to standard library:
    char* fallback_end;
    errno = 0;  // This is Required before calling strtod.
    *out = std::strtod(p, &fallback_end);  // strtod is locale aware.
    if (fallback_end == p) {
      Log::Fatal("no conversion to double for: %s", p);
    }
    if (errno == ERANGE) {
      Log::Warning("convert to double got underflow or overflow: %s", p);
    }
    return fallback_end;
  }
  return fast_end;
}

377
inline static bool AtoiAndCheck(const char* p, int* out) {
378
379
380
381
382
383
384
  const char* after = Atoi(p, out);
  if (*after != '\0') {
    return false;
  }
  return true;
}

385
inline static bool AtofAndCheck(const char* p, double* out) {
386
387
388
389
390
391
392
  const char* after = Atof(p, out);
  if (*after != '\0') {
    return false;
  }
  return true;
}

Guolin Ke's avatar
Guolin Ke committed
393
394
395
396
397
398
399
400
401
402
403
404
405
406
/*!
 * \brief Advance past any leading spaces and tabs.
 * \param p Null-terminated input text
 * \return Pointer to the first character that is neither ' ' nor '\t'
 */
inline static const char* SkipSpaceAndTab(const char* p) {
  for (; *p == ' ' || *p == '\t'; ++p) {
  }
  return p;
}

/*!
 * \brief Advance past any leading '\n', '\r' and space characters.
 * \param p Null-terminated input text
 * \return Pointer to the first character that is none of the three
 */
inline static const char* SkipReturn(const char* p) {
  for (; *p == '\n' || *p == '\r' || *p == ' '; ++p) {
  }
  return p;
}

Guolin Ke's avatar
Guolin Ke committed
407
408
/*!
 * \brief Convert every element of a vector to another type with static_cast.
 * \param arr Source values of type T
 * \return Vector of the same length holding the values cast to T2
 */
template<typename T, typename T2>
inline static std::vector<T2> ArrayCast(const std::vector<T>& arr) {
  std::vector<T2> converted(arr.size());
  std::transform(arr.begin(), arr.end(), converted.begin(),
                 [](const T& item) { return static_cast<T2>(item); });
  return converted;
}

416
417
418
/*!
 * \brief Functor converting a string to T; this primary template parses with Atoi.
 */
template<typename T, bool is_float>
struct __StringToTHelper {
  T operator()(const std::string& str) const {
    T parsed = 0;
    Atoi(str.c_str(), &parsed);
    return parsed;
  }
};

/*!
 * \brief Specialization selected when is_float is true; parses with std::stod.
 */
template<typename T>
struct __StringToTHelper<T, true> {
  T operator()(const std::string& str) const {
    const double parsed = std::stod(str);
    return static_cast<T>(parsed);
  }
};

Guolin Ke's avatar
Guolin Ke committed
432
template<typename T>
433
inline static std::vector<T> StringToArray(const std::string& str, char delimiter) {
Guolin Ke's avatar
Guolin Ke committed
434
  std::vector<std::string> strs = Split(str.c_str(), delimiter);
435
436
  std::vector<T> ret;
  ret.reserve(strs.size());
437
  __StringToTHelper<T, std::is_floating_point<T>::value> helper;
438
439
  for (const auto& s : strs) {
    ret.push_back(helper(s));
Guolin Ke's avatar
Guolin Ke committed
440
441
442
443
  }
  return ret;
}

444
445
446
447
448
449
450
451
452
453
454
/*!
 * \brief Parse a string of bracketed, delimited lists into a vector of vectors.
 * \param str Text holding the bracketed groups
 * \param left_bracket Character opening a group
 * \param right_bracket Character closing a group
 * \param delimiter Character separating the values inside a group
 * \return One converted vector per non-empty group
 */
template<typename T>
inline static std::vector<std::vector<T>> StringToArrayofArrays(
    const std::string& str, char left_bracket, char right_bracket, char delimiter) {
  std::vector<std::vector<T>> arrays;
  const std::vector<std::string> groups = SplitBrackets(str.c_str(), left_bracket, right_bracket);
  for (const std::string& group : groups) {
    arrays.emplace_back(StringToArray<T>(group, delimiter));
  }
  return arrays;
}

Guolin Ke's avatar
Guolin Ke committed
455
template<typename T>
456
457
458
459
460
inline static std::vector<T> StringToArray(const std::string& str, int n) {
  if (n == 0) {
    return std::vector<T>();
  }
  std::vector<std::string> strs = Split(str.c_str(), ' ');
Nikita Titov's avatar
Nikita Titov committed
461
  CHECK_EQ(strs.size(), static_cast<size_t>(n));
Guolin Ke's avatar
Guolin Ke committed
462
  std::vector<T> ret;
463
464
465
466
  ret.reserve(strs.size());
  __StringToTHelper<T, std::is_floating_point<T>::value> helper;
  for (const auto& s : strs) {
    ret.push_back(helper(s));
Guolin Ke's avatar
Guolin Ke committed
467
468
469
470
  }
  return ret;
}

471
472
473
474
475
476
477
478
479
480
481
482
/*!
 * \brief Functor parsing one value at p into *out; this primary template uses Atoi.
 *        Returns the position reported by the parser.
 */
template<typename T, bool is_float>
struct __StringToTHelperFast {
  const char* operator()(const char*p, T* out) const {
    const char* next = Atoi(p, out);
    return next;
  }
};

/*!
 * \brief Specialization selected when is_float is true; parses with Atof and
 *        casts the double result to T.
 */
template<typename T>
struct __StringToTHelperFast<T, true> {
  const char* operator()(const char*p, T* out) const {
    double parsed = 0.0;
    const char* next = Atof(p, &parsed);
    *out = static_cast<T>(parsed);
    return next;
  }
};

template<typename T>
inline static std::vector<T> StringToArrayFast(const std::string& str, int n) {
  if (n == 0) {
    return std::vector<T>();
  }
  auto p_str = str.c_str();
  __StringToTHelperFast<T, std::is_floating_point<T>::value> helper;
  std::vector<T> ret(n);
  for (int i = 0; i < n; ++i) {
    p_str = helper(p_str, &ret[i]);
  }
  return ret;
}

502
template<typename T>
503
inline static std::string Join(const std::vector<T>& strs, const char* delimiter, const bool force_C_locale = false) {
Guolin Ke's avatar
Guolin Ke committed
504
  if (strs.empty()) {
Guolin Ke's avatar
Guolin Ke committed
505
506
    return std::string("");
  }
507
  std::stringstream str_buf;
508
509
510
  if (force_C_locale) {
    C_stringstream(str_buf);
  }
511
  str_buf << std::setprecision(std::numeric_limits<double>::digits10 + 2);
512
  str_buf << strs[0];
Guolin Ke's avatar
Guolin Ke committed
513
  for (size_t i = 1; i < strs.size(); ++i) {
514
515
    str_buf << delimiter;
    str_buf << strs[i];
Guolin Ke's avatar
Guolin Ke committed
516
  }
517
  return str_buf.str();
Guolin Ke's avatar
Guolin Ke committed
518
519
}

520
template<>
521
inline std::string Join<int8_t>(const std::vector<int8_t>& strs, const char* delimiter, const bool force_C_locale) {
522
523
524
525
  if (strs.empty()) {
    return std::string("");
  }
  std::stringstream str_buf;
526
527
528
  if (force_C_locale) {
    C_stringstream(str_buf);
  }
529
530
531
532
533
534
535
536
537
  str_buf << std::setprecision(std::numeric_limits<double>::digits10 + 2);
  str_buf << static_cast<int16_t>(strs[0]);
  for (size_t i = 1; i < strs.size(); ++i) {
    str_buf << delimiter;
    str_buf << static_cast<int16_t>(strs[i]);
  }
  return str_buf.str();
}

538
template<typename T>
539
inline static std::string Join(const std::vector<T>& strs, size_t start, size_t end, const char* delimiter, const bool force_C_locale = false) {
Guolin Ke's avatar
Guolin Ke committed
540
541
542
  if (end - start <= 0) {
    return std::string("");
  }
Guolin Ke's avatar
Guolin Ke committed
543
544
  start = std::min(start, static_cast<size_t>(strs.size()) - 1);
  end = std::min(end, static_cast<size_t>(strs.size()));
545
  std::stringstream str_buf;
546
547
548
  if (force_C_locale) {
    C_stringstream(str_buf);
  }
549
  str_buf << std::setprecision(std::numeric_limits<double>::digits10 + 2);
550
  str_buf << strs[start];
Guolin Ke's avatar
Guolin Ke committed
551
  for (size_t i = start + 1; i < end; ++i) {
552
553
    str_buf << delimiter;
    str_buf << strs[i];
Guolin Ke's avatar
Guolin Ke committed
554
  }
555
  return str_buf.str();
Guolin Ke's avatar
Guolin Ke committed
556
557
}

558
/*!
 * \brief Round x up to the next power of two.
 * \param x Value to round; anything <= 1 yields 1
 * \return Smallest power of two >= x, or 0 when that power does not fit
 *         into a positive int64_t (x > 2^62)
 */
inline static int64_t Pow2RoundUp(int64_t x) {
  const int64_t kMaxPow2 = static_cast<int64_t>(1) << 62;
  // Larger results cannot be represented; answer 0 up front instead of
  // shifting a signed value into (and past) the sign bit.
  if (x > kMaxPow2) {
    return 0;
  }
  int64_t t = 1;
  while (t < x) {
    t <<= 1;
  }
  return t;
}

569
/*!
 * \brief Do inplace softmax transformation on p_rec
 *
 * The maximum is subtracted before exponentiating so the largest exponent is 0.
 * An empty vector is left untouched.
 * \param p_rec The input/output vector of the values.
 */
inline static void Softmax(std::vector<double>* p_rec) {
  std::vector<double> &rec = *p_rec;
  if (rec.empty()) {
    return;  // nothing to normalize; rec[0] below would be out of bounds
  }
  double wmax = rec[0];
  for (size_t i = 1; i < rec.size(); ++i) {
    wmax = std::max(rec[i], wmax);
  }
  double wsum = 0.0;
  for (size_t i = 0; i < rec.size(); ++i) {
    rec[i] = std::exp(rec[i] - wmax);
    wsum += rec[i];
  }
  for (size_t i = 0; i < rec.size(); ++i) {
    rec[i] /= wsum;
  }
}

589
/*!
 * \brief Compute the softmax of an input array into an output array.
 *
 * The maximum is subtracted before exponentiating so the largest exponent is 0.
 * \param input Values to transform; at least len elements are read
 * \param output Receives the len normalized values
 * \param len Number of elements; nothing is read or written when len <= 0
 */
inline static void Softmax(const double* input, double* output, int len) {
  if (len <= 0) {
    return;  // input[0] below would be out of bounds
  }
  double wmax = input[0];
  for (int i = 1; i < len; ++i) {
    wmax = std::max(input[i], wmax);
  }
  double wsum = 0.0;
  for (int i = 0; i < len; ++i) {
    output[i] = std::exp(input[i] - wmax);
    wsum += output[i];
  }
  for (int i = 0; i < len; ++i) {
    output[i] /= wsum;
  }
}

Guolin Ke's avatar
Guolin Ke committed
604
605
606
/*!
 * \brief Build a vector of const raw pointers from a vector of unique_ptr.
 * \param input Owning pointers; ownership is not transferred
 * \return One const T* per element of input, in the same order
 */
template<typename T>
std::vector<const T*> ConstPtrInVectorWrapper(const std::vector<std::unique_ptr<T>>& input) {
  std::vector<const T*> views;
  for (const std::unique_ptr<T>& owner : input) {
    views.push_back(owner.get());
  }
  return views;
}

Guolin Ke's avatar
Guolin Ke committed
613
/*!
 * \brief Stable-sort keys[start..] and reorder values[start..] the same way.
 *
 * Elements before start are left untouched.
 * \param keys Keys to sort in place
 * \param values Values permuted alongside their keys; needs at least
 *        keys->size() elements
 * \param start Index of the first element taking part in the sort
 * \param is_reverse Sort descending when true, ascending otherwise
 */
template<typename T1, typename T2>
inline static void SortForPair(std::vector<T1>* keys, std::vector<T2>* values, size_t start, bool is_reverse = false) {
  auto& ref_key = *keys;
  auto& ref_value = *values;
  std::vector<std::pair<T1, T2>> arr;
  if (start < ref_key.size()) {
    arr.reserve(ref_key.size() - start);
  }
  for (size_t i = start; i < ref_key.size(); ++i) {
    arr.emplace_back(ref_key[i], ref_value[i]);
  }
  if (!is_reverse) {
    std::stable_sort(arr.begin(), arr.end(), [](const std::pair<T1, T2>& a, const std::pair<T1, T2>& b) {
      return a.first < b.first;
    });
  } else {
    std::stable_sort(arr.begin(), arr.end(), [](const std::pair<T1, T2>& a, const std::pair<T1, T2>& b) {
      return a.first > b.first;
    });
  }
  // arr is zero-based while the destination starts at `start`:
  // arr[k] belongs at position start + k.
  for (size_t k = 0; k < arr.size(); ++k) {
    ref_key[start + k] = arr[k].first;
    ref_value[start + k] = arr[k].second;
  }
}

636
/*!
 * \brief Collect the data() pointer of every inner vector.
 * \param data Vector of vectors; the returned pointers refer to its storage
 * \return One T* per inner vector, in the same order
 */
template <typename T>
inline static std::vector<T*> Vector2Ptr(std::vector<std::vector<T>>* data) {
  std::vector<T*> row_ptrs;
  row_ptrs.reserve(data->size());
  for (std::vector<T>& row : *data) {
    row_ptrs.push_back(row.data());
  }
  return row_ptrs;
}

/*!
 * \brief Report the length of every inner vector.
 * \param data Vector of vectors to measure
 * \return size() of each inner vector, cast to int
 */
template <typename T>
inline static std::vector<int> VectorSize(const std::vector<std::vector<T>>& data) {
  std::vector<int> lengths;
  lengths.reserve(data.size());
  for (const std::vector<T>& row : data) {
    lengths.push_back(static_cast<int>(row.size()));
  }
  return lengths;
}

Guolin Ke's avatar
Guolin Ke committed
655
/*!
 * \brief Replace NaN by 0 and clamp the value to [-1e300, 1e300].
 * \param x Value to sanitize
 * \return 0.0 for NaN, otherwise x limited to +/-1e300
 */
inline static double AvoidInf(double x) {
  if (std::isnan(x)) {
    return 0.0;
  }
  if (x >= 1e300) {
    return 1e300;
  }
  if (x <= -1e300) {
    return -1e300;
  }
  return x;
}

667
/*!
 * \brief Replace NaN by 0 and clamp the value to roughly [-1e38, 1e38].
 * \param x Value to sanitize
 * \return 0.0f for NaN, otherwise x limited to +/-1e38f
 */
inline static float AvoidInf(float x) {
  if (std::isnan(x)) {
    return 0.0f;
  }
  // the bounds are double literals, so x is compared after promotion to double
  if (x >= 1e38) {
    return 1e38f;
  }
  if (x <= -1e38) {
    return -1e38f;
  }
  return x;
}

/*!
 * \brief Produce a null pointer typed as the iterator's value_type.
 *
 * Only the type of the result is meaningful; ParallelSort uses it to deduce
 * the element type of an iterator.
 * \return Null pointer of type value_type*
 */
template<typename _Iter> inline
static typename std::iterator_traits<_Iter>::value_type* IteratorValType(_Iter) {
  return nullptr;
}

684
template<typename _RanIt, typename _Pr, typename _VTRanIt> inline
685
686
687
static void ParallelSort(_RanIt _First, _RanIt _Last, _Pr _Pred, _VTRanIt*) {
  size_t len = _Last - _First;
  const size_t kMinInnerLen = 1024;
688
  int num_threads = OMP_NUM_THREADS();
689
690
691
692
693
694
695
  if (len <= kMinInnerLen || num_threads <= 1) {
    std::sort(_First, _Last, _Pred);
    return;
  }
  size_t inner_size = (len + num_threads - 1) / num_threads;
  inner_size = std::max(inner_size, kMinInnerLen);
  num_threads = static_cast<int>((len + inner_size - 1) / inner_size);
696
#pragma omp parallel for schedule(static, 1)
697
698
699
700
701
702
703
704
705
706
707
  for (int i = 0; i < num_threads; ++i) {
    size_t left = inner_size*i;
    size_t right = left + inner_size;
    right = std::min(right, len);
    if (right > left) {
      std::sort(_First + left, _First + right, _Pred);
    }
  }
  // Buffer for merge.
  std::vector<_VTRanIt> temp_buf(len);
  _RanIt buf = temp_buf.begin();
708
  size_t s = inner_size;
709
710
711
  // Recursive merge
  while (s < len) {
    int loop_size = static_cast<int>((len + s * 2 - 1) / (s * 2));
712
    #pragma omp parallel for schedule(static, 1)
713
714
715
716
717
    for (int i = 0; i < loop_size; ++i) {
      size_t left = i * 2 * s;
      size_t mid = left + s;
      size_t right = mid + s;
      right = std::min(len, right);
Guolin Ke's avatar
Guolin Ke committed
718
      if (mid >= right) { continue; }
719
720
721
722
723
724
725
      std::copy(_First + left, _First + mid, buf + left);
      std::merge(buf + left, buf + mid, _First + mid, _First + right, _First + left, _Pred);
    }
    s *= 2;
  }
}

726
/*!
 * \brief Convenience overload of ParallelSort that deduces the element type
 *        from the iterator through IteratorValType.
 * \param _First Random access iterator to the first element
 * \param _Last Random access iterator one past the last element
 * \param _Pred Strict weak ordering used for sorting
 */
template<typename _RanIt, typename _Pr> inline
static void ParallelSort(_RanIt _First, _RanIt _Last, _Pr _Pred) {
  auto* value_type_tag = IteratorValType(_First);
  ParallelSort(_First, _Last, _Pred, value_type_tag);
}

731
// Check that all y[] are in interval [ymin, ymax] (end points included); throws error if not
732
template <typename T>
733
inline static void CheckElementsIntervalClosed(const T *y, T ymin, T ymax, int ny, const char *callername) {
734
  auto fatal_msg = [&y, &ymin, &ymax, &callername](int i) {
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
    std::ostringstream os;
    os << "[%s]: does not tolerate element [#%i = " << y[i] << "] outside [" << ymin << ", " << ymax << "]";
    Log::Fatal(os.str().c_str(), callername, i);
  };
  for (int i = 1; i < ny; i += 2) {
    if (y[i - 1] < y[i]) {
      if (y[i - 1] < ymin) {
        fatal_msg(i - 1);
      } else if (y[i] > ymax) {
        fatal_msg(i);
      }
    } else {
      if (y[i - 1] > ymax) {
        fatal_msg(i - 1);
      } else if (y[i] < ymin) {
        fatal_msg(i);
      }
    }
  }
754
  if (ny & 1) {  // odd
755
756
    if (y[ny - 1] < ymin || y[ny - 1] > ymax) {
      fatal_msg(ny - 1);
757
758
759
760
761
762
    }
  }
}

// One-pass scan over array w with nw elements: find min, max and sum of elements;
// this is useful for checking weight requirements.
// Elements are processed in pairs, and the sum is accumulated in T1 before it
// is cast to T2. Each of mi, ma and su may be nullptr when that result is not
// wanted. With nw <= 0 there is nothing to scan and no output is written.
template <typename T1, typename T2>
inline static void ObtainMinMaxSum(const T1 *w, int nw, T1 *mi, T1 *ma, T2 *su) {
  if (nw <= 0) {
    return;  // w[0] / w[1] below would be read out of bounds
  }
  T1 minw;
  T1 maxw;
  T1 sumw;
  int i;
  if (nw & 1) {  // odd
    // seed with the first element; pairs start at (w[1], w[2])
    minw = w[0];
    maxw = w[0];
    sumw = w[0];
    i = 2;
  } else {  // even
    // seed with the first pair; further pairs start at (w[2], w[3])
    if (w[0] < w[1]) {
      minw = w[0];
      maxw = w[1];
    } else {
      minw = w[1];
      maxw = w[0];
    }
    sumw = w[0] + w[1];
    i = 3;
  }
  for (; i < nw; i += 2) {
    if (w[i - 1] < w[i]) {
      minw = std::min(minw, w[i - 1]);
      maxw = std::max(maxw, w[i]);
    } else {
      minw = std::min(minw, w[i]);
      maxw = std::max(maxw, w[i - 1]);
    }
    sumw += w[i - 1] + w[i];
  }
  if (mi != nullptr) {
    *mi = minw;
  }
  if (ma != nullptr) {
    *ma = maxw;
  }
  if (su != nullptr) {
    *su = static_cast<T2>(sumw);
  }
}

806
/*!
 * \brief Create a zeroed bitset with room for n bits.
 * \param n Number of bits needed
 * \return Vector of 32-bit words, all 0, sized to n / 32 rounded up
 */
inline static std::vector<uint32_t> EmptyBitset(int n) {
  const int partial_word = (n % 32 != 0) ? 1 : 0;
  const int num_words = n / 32 + partial_word;
  return std::vector<uint32_t>(num_words);
}

/*!
 * \brief Set bit number val in a bitset, growing the bitset when needed.
 * \param vec Bitset stored as 32-bit words; new words are zero-initialized
 * \param val Index of the bit to set
 */
template<typename T>
inline static void InsertBitset(std::vector<uint32_t>* vec, const T val) {
  auto& ref_v = *vec;
  int i1 = val / 32;
  int i2 = val % 32;
  if (static_cast<int>(vec->size()) < i1 + 1) {
    vec->resize(i1 + 1, 0);
  }
  // build the mask as unsigned: 1 << 31 would overflow a signed int
  ref_v[i1] |= (static_cast<uint32_t>(1) << i2);
}

823
824
/*!
 * \brief Build a bitset with the bits listed in vals set.
 * \param vals Indices of the bits to set; n elements are read
 * \param n Number of entries in vals
 * \return Bitset stored as 32-bit words, just large enough for the highest bit
 */
template<typename T>
inline static std::vector<uint32_t> ConstructBitset(const T* vals, int n) {
  std::vector<uint32_t> ret;
  for (int i = 0; i < n; ++i) {
    int i1 = vals[i] / 32;
    int i2 = vals[i] % 32;
    if (static_cast<int>(ret.size()) < i1 + 1) {
      ret.resize(i1 + 1, 0);
    }
    // build the mask as unsigned: 1 << 31 would overflow a signed int
    ret[i1] |= (static_cast<uint32_t>(1) << i2);
  }
  return ret;
}

837
838
/*!
 * \brief Test whether bit number pos is set in a bitset.
 * \param bits Bitset stored as 32-bit words
 * \param n Number of words in bits
 * \param pos Index of the bit to test
 * \return true when the bit is set; false when pos lies beyond the n words
 */
template<typename T>
inline static bool FindInBitset(const uint32_t* bits, int n, T pos) {
  const int word = pos / 32;
  if (word >= n) {
    return false;
  }
  const int bit = pos % 32;
  const uint32_t shifted = bits[word] >> bit;
  return (shifted & 1) != 0;
}

847
848
849
850
851
852
/*!
 * \brief Check that b does not exceed a by more than one representable step.
 * \param a Reference value
 * \param b Value compared against a
 * \return true when b <= nextafter(a, +infinity)
 */
inline static bool CheckDoubleEqualOrdered(double a, double b) {
  return b <= std::nextafter(a, INFINITY);
}

/*!
 * \brief Get the next representable double above a.
 * \param a Reference value
 * \return nextafter(a, +infinity)
 */
inline static double GetDoubleUpperBound(double a) {
  const double next_up = std::nextafter(a, INFINITY);
  return next_up;
}

856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
/*!
 * \brief Measure the length of the first line of a string.
 * \param str Null-terminated input text
 * \return Number of characters before the first '\n', '\r' or the terminator
 */
inline static size_t GetLine(const char* str) {
  const char* cursor = str;
  for (; *cursor != '\0' && *cursor != '\n' && *cursor != '\r'; ++cursor) {
  }
  return cursor - str;
}

/*!
 * \brief Step over one line ending: an optional '\r' followed by an optional '\n'.
 * \param str Null-terminated input text
 * \return Pointer just past the consumed line ending
 */
inline static const char* SkipNewLine(const char* str) {
  str += (*str == '\r') ? 1 : 0;
  str += (*str == '\n') ? 1 : 0;
  return str;
}

874
875
876
877
878
/*!
 * \brief Sign of a value.
 * \param x Value to classify
 * \return 1 when x > 0, -1 when x < 0 and 0 otherwise
 */
template <typename T>
static int Sign(T x) {
  const int is_positive = (x > T(0)) ? 1 : 0;
  const int is_negative = (x < T(0)) ? 1 : 0;
  return is_positive - is_negative;
}

Guolin Ke's avatar
Guolin Ke committed
879
880
881
882
883
884
885
886
887
/*!
 * \brief Natural logarithm that maps every non-positive input to -infinity.
 * \param x Value to take the logarithm of
 * \return std::log(x) when x > 0, otherwise -INFINITY
 */
template <typename T>
static T SafeLog(T x) {
  if (!(x > 0)) {
    return -INFINITY;
  }
  return std::log(x);
}

888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
/*!
 * \brief Check that a string holds none of the characters " , : [ ] { }.
 * \param s Text to inspect
 * \return false as soon as one of the seven characters is found, true otherwise
 */
inline bool CheckAllowedJSON(const std::string& s) {
  for (const char c : s) {
    switch (static_cast<unsigned char>(c)) {
      case 34:   // "
      case 44:   // ,
      case 58:   // :
      case 91:   // [
      case 93:   // ]
      case 123:  // {
      case 125:  // }
        return false;
      default:
        break;
    }
  }
  return true;
}

906
907
908
909
910
911
/*!
 * \brief Round by adding 0.5 and truncating toward zero.
 * \param x Value to round
 * \return static_cast<int>(x + 0.5)
 */
inline int RoundInt(double x) {
  const double shifted = x + 0.5;
  return static_cast<int>(shifted);
}

/*!
 * \brief Stateless allocator that obtains its memory from _mm_malloc with an
 *        alignment request of N and releases it with _mm_free.
 *
 * NOTE(review): allocate() forwards the result of _mm_malloc unchecked, so a
 * failed allocation is returned to the caller as a null pointer.
 * \tparam T Element type
 * \tparam N Alignment passed to _mm_malloc
 */
template <typename T, std::size_t N = 32>
class AlignmentAllocator {
 public:
  typedef T value_type;
  typedef std::size_t size_type;
  typedef std::ptrdiff_t difference_type;

  typedef T* pointer;
  typedef const T* const_pointer;

  typedef T& reference;
  typedef const T& const_reference;

  // noexcept replaces the dynamic exception specification throw(), which is
  // deprecated and no longer part of C++20.
  inline AlignmentAllocator() noexcept {}

  /*! \brief Converting constructor; the allocator has no state to copy. */
  template <typename T2>
  inline AlignmentAllocator(const AlignmentAllocator<T2, N>&) noexcept {}

  inline ~AlignmentAllocator() noexcept {}

  /*! \brief Address of r (the spelling "adress" is part of the existing interface). */
  inline pointer adress(reference r) {
    return &r;
  }

  inline const_pointer adress(const_reference r) const {
    return &r;
  }

  /*! \brief Request storage for n objects of type T; the objects are not constructed. */
  inline pointer allocate(size_type n) {
    return static_cast<pointer>(_mm_malloc(n * sizeof(value_type), N));
  }

  /*! \brief Release storage obtained from allocate(). */
  inline void deallocate(pointer p, size_type) {
    _mm_free(p);
  }

  /*! \brief Copy-construct wert into the storage at p. */
  inline void construct(pointer p, const value_type& wert) {
    new (p) value_type(wert);
  }

  /*! \brief Run the destructor of the object at p without freeing its storage. */
  inline void destroy(pointer p) {
    p->~value_type();
  }

  /*! \brief Largest element count whose byte size still fits into size_type. */
  inline size_type max_size() const noexcept {
    return size_type(-1) / sizeof(value_type);
  }

  template <typename T2>
  struct rebind {
    typedef AlignmentAllocator<T2, N> other;
  };

  bool operator!=(const AlignmentAllocator<T, N>& other) const {
    return !(*this == other);
  }

  // Returns true if and only if storage allocated from *this
  // can be deallocated from other, and vice versa.
  // Always returns true for stateless allocators.
  bool operator==(const AlignmentAllocator<T, N>&) const {
    return true;
  }
};

/*!
 * \brief Accumulates named timings, kept separately per OpenMP thread id.
 *        All bookkeeping is compiled in only when ``TIMETAG`` is defined;
 *        otherwise ``Start``, ``Stop`` and ``Print`` do nothing.
 *        The destructor calls ``Print``.
 */
class Timer {
 public:
  Timer() {
#ifdef TIMETAG
    // One slot per thread so that Start/Stop can index by thread id.
    int num_threads = OMP_NUM_THREADS();
    start_time_.resize(num_threads);
    stats_.resize(num_threads);
#endif  // TIMETAG
  }

  ~Timer() { Print(); }

#ifdef TIMETAG
  /*! \brief Record the current time as the start of ``name`` for the calling thread */
  void Start(const std::string& name) {
    auto tid = omp_get_thread_num();
    start_time_[tid][name] = std::chrono::steady_clock::now();
  }

  /*! \brief Add the time elapsed since the matching ``Start`` to the total of ``name`` for the calling thread */
  void Stop(const std::string& name) {
    auto cur_time = std::chrono::steady_clock::now();
    auto tid = omp_get_thread_num();
    if (stats_[tid].find(name) == stats_[tid].end()) {
      stats_[tid][name] = std::chrono::duration<double, std::milli>(0);
    }
    stats_[tid][name] += cur_time - start_time_[tid][name];
  }

#else
  void Start(const std::string&) {}

  void Stop(const std::string&) {}
#endif  // TIMETAG

  /*! \brief Log the total of every name, summed over all threads, in ascending order of name */
  void Print() const {
#ifdef TIMETAG
    // Merge the per-thread totals directly into an ordered map.
    std::map<std::string, std::chrono::duration<double, std::milli>> ordered;
    for (const auto& thread_stats : stats_) {
      for (const auto& entry : thread_stats) {
        auto inserted = ordered.emplace(entry.first, entry.second);
        if (!inserted.second) {
          inserted.first->second += entry.second;
        }
      }
    }
    for (const auto& entry : ordered) {
      // %f expects a double: pass the tick count (milliseconds) scaled to seconds,
      // not the duration object itself.
      Log::Info("%s costs:\t %f", entry.first.c_str(), entry.second.count() * 1e-3);
    }
#endif  // TIMETAG
  }
#ifdef TIMETAG
  /*! \brief Most recent start time of every name, one map per thread */
  std::vector<
      std::unordered_map<std::string, std::chrono::steady_clock::time_point>>
      start_time_;
  /*! \brief Accumulated duration of every name, one map per thread */
  std::vector<std::unordered_map<std::string,
                                 std::chrono::duration<double, std::milli>>>
      stats_;
#endif  // TIMETAG
};

// Note: this class is not thread-safe, don't use it inside omp blocks
class FunctionTimer {
 public:
1041
#ifdef TIMETAG
Guolin Ke's avatar
Guolin Ke committed
1042
  FunctionTimer(const std::string& name, Timer& timer) : timer_(timer) {
1043
1044
1045
    timer.Start(name);
    name_ = name;
  }
1046

Guolin Ke's avatar
Guolin Ke committed
1047
  ~FunctionTimer() { timer_.Stop(name_); }
1048

1049
1050
1051
 private:
  std::string name_;
  Timer& timer_;
1052
1053
1054
#else
  FunctionTimer(const std::string&, Timer&) {}
#endif  // TIMETAG
1055
1056
};

Guolin Ke's avatar
Guolin Ke committed
1057
1058
}  // namespace Common

1059
1060
// Declaration only: the global_timer object itself is defined in another translation unit.
extern Common::Timer global_timer;

1061
1062
1063
1064
1065
1066
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
1083
1084
1085
1086
1087
1088
1089
1090
1091
1092
1093
1094
1095
1096
1097
1098
1099
1100
1101
1102
1103
1104
1105
1106
1107
1108
1109
1110
1111
1112
1113
1114
1115
1116
1117
1118
1119
1120
1121
1122
1123
1124
1125

/*!
* Provides locale-independent alternatives to Common's methods.
* Essential to make models robust to locale settings.
*/
namespace CommonC {

/*!
 * \brief Join all elements of ``strs`` with ``delimiter`` by delegating to ``Common::Join``.
 * \note The trailing ``true`` argument presumably selects the locale-independent path of
 *       ``Common::Join`` (confirm against its declaration).
 */
template<typename T>
inline static std::string Join(const std::vector<T>& strs, const char* delimiter) {
  const bool trailing_flag = true;
  return LightGBM::Common::Join(strs, delimiter, trailing_flag);
}

/*!
 * \brief Join the elements of ``strs`` selected by ``start`` and ``end`` with ``delimiter``
 *        by delegating to the ranged ``Common::Join``.
 * \note The trailing ``true`` argument presumably selects the locale-independent path of
 *       ``Common::Join`` (confirm against its declaration).
 */
template<typename T>
inline static std::string Join(const std::vector<T>& strs, size_t start, size_t end, const char* delimiter) {
  const bool trailing_flag = true;
  return LightGBM::Common::Join(strs, start, end, delimiter, trailing_flag);
}

/*!
 * \brief Forward to ``Common::Atof``.
 * \param p Text to parse
 * \param out Receives the parsed value
 * \return The pointer returned by ``Common::Atof``
 */
inline static const char* Atof(const char* p, double* out) {
  const char* rest = LightGBM::Common::Atof(p, out);
  return rest;
}

/*!
 * \brief Primary template of the fast parser helper: forwards to ``Common::Atoi``.
 *        The ``is_float == true`` case is handled by a separate specialization.
 */
template<typename T, bool is_float>
struct __StringToTHelperFast {
  const char* operator()(const char*p, T* out) const {
    const char* rest = LightGBM::Common::Atoi(p, out);
    return rest;
  }
};

/*!
* \brief Floating point specialization: parses a double with ``Atof`` and casts the result to ``T``.
* \warning Beware that ``Common::Atof`` in ``__StringToTHelperFast``
*          has **less** floating point precision than ``__StringToTHelper``.
*          Both versions are kept to maintain bit-for-bit the "legacy" LightGBM behaviour in terms of precision.
*          Check ``StringToArrayFast`` and ``StringToArray`` for more details on this.
*/
template<typename T>
struct __StringToTHelperFast<T, true> {
  const char* operator()(const char*p, T* out) const {
    double parsed = 0.0;
    const char* rest = Atof(p, &parsed);
    *out = static_cast<T>(parsed);
    return rest;
  }
};

/*!
 * \brief Primary template of the string-to-value helper: parses ``str`` with ``Common::Atoi``.
 *        The result starts at 0 and the pointer returned by ``Common::Atoi`` is ignored.
 *        The ``is_float == true`` case is handled by a separate specialization.
 */
template<typename T, bool is_float>
struct __StringToTHelper {
  T operator()(const std::string& str) const {
    T value = 0;
    LightGBM::Common::Atoi(str.c_str(), &value);
    return value;
  }
};

/*!
* \warning Beware that ``Common::Atof`` in ``__StringToTHelperFast``,
*          has **less** floating point precision than ``__StringToTHelper``.
*          Both versions are kept to maintain bit-for-bit the "legacy" LightGBM behaviour in terms of precision.
*          Check ``StringToArrayFast`` and ``StringToArray`` for more details on this.
* \note It is possible that ``fast_double_parser::parse_number`` is faster than ``Common::Atof``.
*/
template<typename T>
struct __StringToTHelper<T, true> {
  T operator()(const std::string& str) const {
    double tmp;

Chen Yufei's avatar
Chen Yufei committed
1126
1127
    const char* end = Common::AtofPrecise(str.c_str(), &tmp);
    if (end == str.c_str()) {
1128
        Log::Fatal("Failed to parse double: %s", str.c_str());
1129
1130
1131
1132
1133
1134
1135
1136
1137
1138
1139
1140
1141
1142
1143
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
1154
1155
1156
1157
1158
1159
1160
1161
1162
1163
1164
1165
1166
1167
1168
1169
1170
1171
1172
1173
1174
1175
1176
1177
1178
1179
1180
1181
1182
1183
1184
1185
1186
1187
1188
1189
1190
1191
1192
1193
1194
1195
1196
1197
1198
1199
1200
1201
1202
1203
1204
1205
1206
1207
1208
1209
1210
1211
1212
1213
1214
1215
1216
1217
1218
1219
1220
1221
1222
1223
1224
1225
1226
1227
1228
1229
1230
1231
1232
1233
1234
1235
1236
1237
1238
1239
1240
1241
1242
1243
1244
1245
1246
1247
1248
1249
1250
1251
1252
1253
1254
1255
1256
1257
1258
1259
1260
1261
1262
1263
1264
1265
    }

    return static_cast<T>(tmp);
  }
};


/*!
* \warning Beware that due to internal use of ``Common::Atof`` in ``__StringToTHelperFast``,
*          this method has less precision for floating point numbers than ``StringToArray``,
*          which calls ``__StringToTHelper``.
*          As such, ``StringToArrayFast`` and ``StringToArray`` are not equivalent!
*          Both versions were kept to maintain bit-for-bit the "legacy" LightGBM behaviour in terms of precision.
*/
template<typename T>
inline static std::vector<T> StringToArrayFast(const std::string& str, int n) {
  if (n == 0) {
    return std::vector<T>();
  }
  auto p_str = str.c_str();
  __StringToTHelperFast<T, std::is_floating_point<T>::value> helper;
  std::vector<T> ret(n);
  for (int i = 0; i < n; ++i) {
    p_str = helper(p_str, &ret[i]);
  }
  return ret;
}

/*!
* \warning Do not replace calls to this method by ``StringToArrayFast``.
*          This method is more precise for floating point numbers.
*          Check ``StringToArrayFast`` for more details.
*/
template<typename T>
inline static std::vector<T> StringToArray(const std::string& str, int n) {
  if (n == 0) {
    return std::vector<T>();
  }
  std::vector<std::string> strs = LightGBM::Common::Split(str.c_str(), ' ');
  CHECK_EQ(strs.size(), static_cast<size_t>(n));
  std::vector<T> ret;
  ret.reserve(strs.size());
  __StringToTHelper<T, std::is_floating_point<T>::value> helper;
  for (const auto& s : strs) {
    ret.push_back(helper(s));
  }
  return ret;
}

/*!
* \warning Do not replace calls to this method by ``StringToArrayFast``.
*          This method is more precise for floating point numbers.
*          Check ``StringToArrayFast`` for more details.
*/
template<typename T>
inline static std::vector<T> StringToArray(const std::string& str, char delimiter) {
  std::vector<std::string> strs = LightGBM::Common::Split(str.c_str(), delimiter);
  std::vector<T> ret;
  ret.reserve(strs.size());
  __StringToTHelper<T, std::is_floating_point<T>::value> helper;
  for (const auto& s : strs) {
    ret.push_back(helper(s));
  }
  return ret;
}

#if (!((defined(sun) || defined(__sun)) && (defined(__SVR4) || defined(__svr4__))))
/*!
* Formats a value into a buffer according to a format string and null-terminates the result.
*
* \note The call aborts through ``Log::Fatal`` unless the formatted text plus its terminator
*       fits into ``buf_len`` bytes.
*       This safety check serves to prevent incorrect internal API usage:
*         - The received buffer size shall be sufficient at all times for the input format string and value.
*/
template <typename T>
inline static void format_to_buf(char* buffer, const size_t buf_len, const char* format, const T value) {
  // ``size`` is the length reported by fmt::format_to_n for the formatted text.
  const auto written = fmt::format_to_n(buffer, buf_len, format, value).size;
  if (!(written < buf_len)) {
    Log::Fatal("Numerical conversion failed. Buffer is too small.");
  }
  buffer[written] = '\0';
}

/*!
 * \brief Primary template of the value-to-string helper: formats ``value`` with the ``{}`` format.
 */
template<typename T, bool is_float, bool high_precision>
struct __TToStringHelper {
  void operator()(T value, char* buffer, size_t buf_len) const {
    const char* const fmt_spec = "{}";
    format_to_buf(buffer, buf_len, fmt_spec, value);
  }
};

/*!
 * \brief Specialization for ``is_float == true`` and ``high_precision == false``:
 *        formats ``value`` with the ``{:g}`` format.
 */
template<typename T>
struct __TToStringHelper<T, true, false> {
  void operator()(T value, char* buffer, size_t buf_len) const {
    const char* const fmt_spec = "{:g}";
    format_to_buf(buffer, buf_len, fmt_spec, value);
  }
};

/*!
 * \brief Specialization for ``is_float == true`` and ``high_precision == true``:
 *        formats ``value`` with the ``{:.17g}`` format.
 */
template<typename T>
struct __TToStringHelper<T, true, true> {
  void operator()(T value, char* buffer, size_t buf_len) const {
    const char* const fmt_spec = "{:.17g}";
    format_to_buf(buffer, buf_len, fmt_spec, value);
  }
};

/*!
* Converts an array to a string with values separated by the space character.
* This method replaces Common's ``ArrayToString`` and ``ArrayToStringFast`` functionality
* and is locale-independent.
*
* At most ``min(n, arr.size())`` leading elements are written; an empty array or ``n == 0``
* yields an empty string.
*
* \note If ``high_precision_output`` is set to true,
*       floating point values are output with more digits of precision.
*/
template<bool high_precision_output = false, typename T>
inline static std::string ArrayToString(const std::vector<T>& arr, size_t n) {
  if (arr.empty() || n == 0) {
    return std::string("");
  }
  __TToStringHelper<T, std::is_floating_point<T>::value, high_precision_output> helper;
  // 32 bytes hold every value the helpers can emit, including 64-bit integers
  // (up to 20 characters), which a 16-byte buffer cannot fit.
  const size_t buf_len = 32;
  std::vector<char> buffer(buf_len);
  std::stringstream str_buf;
  Common::C_stringstream(str_buf);
  const size_t count = std::min(n, arr.size());
  helper(arr[0], buffer.data(), buf_len);
  str_buf << buffer.data();
  for (size_t i = 1; i < count; ++i) {
    helper(arr[i], buffer.data(), buf_len);
    str_buf << ' ' << buffer.data();
  }
  return str_buf.str();
}
#endif  // (!((defined(sun) || defined(__sun)) && (defined(__SVR4) || defined(__svr4__))))


}  // namespace CommonC


Guolin Ke's avatar
Guolin Ke committed
1266
1267
}  // namespace LightGBM

1268
#endif  // LIGHTGBM_UTILS_COMMON_H_