]>
Commit | Line | Data |
---|---|---|
7c673cae | 1 | // Copyright (c) 2011-present, Facebook, Inc. All rights reserved. |
11fdf7f2 TL |
2 | // This source code is licensed under both the GPLv2 (found in the |
3 | // COPYING file in the root directory) and Apache 2.0 License | |
4 | // (found in the LICENSE.Apache file in the root directory). | |
7c673cae FG |
5 | // |
6 | #include "util/string_util.h" | |
7 | ||
8 | #ifndef __STDC_FORMAT_MACROS | |
9 | #define __STDC_FORMAT_MACROS | |
10 | #endif | |
11 | ||
12 | #include <errno.h> | |
13 | #include <inttypes.h> | |
14 | #include <stdarg.h> | |
15 | #include <stdio.h> | |
16 | #include <stdlib.h> | |
17 | #include <algorithm> | |
18 | #include <cmath> | |
19 | #include <sstream> | |
20 | #include <string> | |
21 | #include <utility> | |
22 | #include <vector> | |
23 | #include "rocksdb/env.h" | |
24 | #include "rocksdb/slice.h" | |
25 | ||
26 | namespace rocksdb { | |
27 | ||
28 | const std::string kNullptrString = "nullptr"; | |
29 | ||
// Splits `arg` on every occurrence of `delim` and returns the pieces in
// order. Empty pieces between adjacent delimiters are kept, but a delimiter
// that is the very last character does not produce a trailing empty piece.
// An empty input yields an empty vector.
std::vector<std::string> StringSplit(const std::string& arg, char delim) {
  std::vector<std::string> pieces;
  size_t pos = 0;
  while (pos < arg.size()) {
    const size_t next = arg.find(delim, pos);
    if (next == std::string::npos) {
      // No more delimiters: the remainder is the final piece.
      pieces.push_back(arg.substr(pos));
      break;
    }
    pieces.push_back(arg.substr(pos, next - pos));
    pos = next + 1;
  }
  return pieces;
}
39 | ||
// Writes a human-readable rendering of a duration given in microseconds into
// `output` (a buffer of `len` bytes) and returns the value returned by
// snprintf, i.e. the length the full text requires excluding the NUL.
//
// When fixed_format is false the unit is picked from the magnitude:
//   micros < 10 ms   -> "XX us"
//   micros < 10 sec  -> "XX.XXX ms"
//   micros < 1 min   -> "XX.XXX sec"
//   micros < 1 hour  -> "MM:SS.sss M:S"
//   otherwise        -> "HH:MM:SS.sss H:M:S"
// When fixed_format is true the "H:M:S" form is always used.
int AppendHumanMicros(uint64_t micros, char* output, int len,
                      bool fixed_format) {
  // Seconds within the current minute, including the fractional part.
  const double seconds_in_minute =
      static_cast<double>(micros % 60000000) / 1000000;

  if (!fixed_format) {
    if (micros < 10000) {
      return snprintf(output, len, "%" PRIu64 " us", micros);
    }
    if (micros < 10000000) {
      return snprintf(output, len, "%.3lf ms",
                      static_cast<double>(micros) / 1000);
    }
    if (micros < 1000000ll * 60) {
      return snprintf(output, len, "%.3lf sec",
                      static_cast<double>(micros) / 1000000);
    }
    if (micros < 1000000ll * 60 * 60) {
      // Width 6 = two integer digits + '.' + three decimals, so that values
      // below ten seconds are zero padded ("05.000").
      return snprintf(output, len, "%02" PRIu64 ":%06.3f M:S",
                      micros / 1000000 / 60, seconds_in_minute);
    }
  }
  return snprintf(output, len, "%02" PRIu64 ":%02" PRIu64 ":%06.3f H:M:S",
                  micros / 1000000 / 3600, (micros / 1000000 / 60) % 60,
                  seconds_in_minute);
}
65 | ||
// Writes a compact size summary for `bytes` into `output` (a buffer of `len`
// bytes) and returns the value returned by snprintf.
//
// The largest unit for which the value is at least 10 is used, with the
// value truncated to a whole number of that unit:
//   >= 10TB -> "XXTB", >= 10GB -> "XXGB", >= 10MB -> "XXMB",
//   >= 10KB -> "XXKB", otherwise "XXB".
int AppendHumanBytes(uint64_t bytes, char* output, int len) {
  struct Unit {
    int shift;
    const char* suffix;
  };
  // Ordered from largest to smallest so the first match wins.
  static const Unit kUnits[] = {
      {40, "TB"}, {30, "GB"}, {20, "MB"}, {10, "KB"}};

  const uint64_t kTen = 10;
  for (const Unit& unit : kUnits) {
    if (bytes >= (kTen << unit.shift)) {
      return snprintf(output, len, "%" PRIu64 "%s", bytes >> unit.shift,
                      unit.suffix);
    }
  }
  return snprintf(output, len, "%" PRIu64 "B", bytes);
}
84 | ||
// Appends the decimal representation of `num` to `*str`.
void AppendNumberTo(std::string* str, uint64_t num) {
  // A uint64_t needs at most 20 digits, so 30 bytes is always enough.
  char digits[30];
  const int written = snprintf(digits, sizeof(digits), "%" PRIu64, num);
  str->append(digits, static_cast<size_t>(written));
}
90 | ||
91 | void AppendEscapedStringTo(std::string* str, const Slice& value) { | |
92 | for (size_t i = 0; i < value.size(); i++) { | |
93 | char c = value[i]; | |
94 | if (c >= ' ' && c <= '~') { | |
95 | str->push_back(c); | |
96 | } else { | |
97 | char buf[10]; | |
98 | snprintf(buf, sizeof(buf), "\\x%02x", | |
99 | static_cast<unsigned int>(c) & 0xff); | |
100 | str->append(buf); | |
101 | } | |
102 | } | |
103 | } | |
104 | ||
105 | std::string NumberToString(uint64_t num) { | |
106 | std::string r; | |
107 | AppendNumberTo(&r, num); | |
108 | return r; | |
109 | } | |
110 | ||
// Returns a short rendering of `num` that uses a K / M / G suffix (powers of
// 1000) once the magnitude reaches 10,000 / 10,000,000 / 10,000,000,000.
// The scaled value is truncated toward zero and keeps the sign of `num`.
std::string NumberToHumanString(int64_t num) {
  char buf[19];
  // Take the magnitude in unsigned arithmetic: negating INT64_MIN as a signed
  // value would overflow.
  const uint64_t magnitude = num < 0 ? (uint64_t{0} - static_cast<uint64_t>(num))
                                     : static_cast<uint64_t>(num);
  if (magnitude < 10000ULL) {
    snprintf(buf, sizeof(buf), "%" PRIi64, num);
  } else if (magnitude < 10000000ULL) {
    snprintf(buf, sizeof(buf), "%" PRIi64 "K", num / 1000);
  } else if (magnitude < 10000000000ULL) {
    snprintf(buf, sizeof(buf), "%" PRIi64 "M", num / 1000000);
  } else {
    snprintf(buf, sizeof(buf), "%" PRIi64 "G", num / 1000000000);
  }
  return std::string(buf);
}
125 | ||
// Returns `bytes` rendered with two decimals in KB, MB, GB or TB (powers of
// 1024). The smallest unit used is KB; the value is scaled up to the next
// unit while it is at least 1024 and a larger unit exists.
std::string BytesToHumanString(uint64_t bytes) {
  static const char* const kUnitNames[] = {"KB", "MB", "GB", "TB"};
  const size_t kLastUnit = 3;

  // Always start with KB.
  double scaled = static_cast<double>(bytes);
  scaled /= 1024;

  size_t unit = 0;
  for (; unit < kLastUnit && scaled >= 1024; ++unit) {
    scaled /= 1024;
  }

  char text[20];
  snprintf(text, sizeof(text), "%.2f %s", scaled, kUnitNames[unit]);
  return std::string(text);
}
144 | ||
145 | std::string EscapeString(const Slice& value) { | |
146 | std::string r; | |
147 | AppendEscapedStringTo(&r, value); | |
148 | return r; | |
149 | } | |
150 | ||
151 | bool ConsumeDecimalNumber(Slice* in, uint64_t* val) { | |
152 | uint64_t v = 0; | |
153 | int digits = 0; | |
154 | while (!in->empty()) { | |
155 | char c = (*in)[0]; | |
156 | if (c >= '0' && c <= '9') { | |
157 | ++digits; | |
158 | const unsigned int delta = (c - '0'); | |
159 | static const uint64_t kMaxUint64 = ~static_cast<uint64_t>(0); | |
160 | if (v > kMaxUint64 / 10 || | |
161 | (v == kMaxUint64 / 10 && delta > kMaxUint64 % 10)) { | |
162 | // Overflow | |
163 | return false; | |
164 | } | |
165 | v = (v * 10) + delta; | |
166 | in->remove_prefix(1); | |
167 | } else { | |
168 | break; | |
169 | } | |
170 | } | |
171 | *val = v; | |
172 | return (digits > 0); | |
173 | } | |
174 | ||
// Returns true for the characters that must be backslash-escaped in an
// option string: backslash, '#', ':', carriage return and line feed.
bool isSpecialChar(const char c) {
  switch (c) {
    case '\\':
    case '#':
    case ':':
    case '\r':
    case '\n':
      return true;
    default:
      return false;
  }
}
181 | ||
182 | namespace { | |
183 | using CharMap = std::pair<char, char>; | |
184 | } | |
185 | ||
// Maps the character that follows a backslash in an escaped option string
// back to the character it stands for: 'r' -> CR, 'n' -> LF. Any other
// character is returned unchanged.
char UnescapeChar(const char c) {
  switch (c) {
    case 'r':
      return '\r';
    case 'n':
      return '\n';
    default:
      return c;
  }
}
197 | ||
// Maps a character to the letter that represents it after a backslash in an
// escaped option string: LF -> 'n', CR -> 'r'. Any other character is
// returned unchanged.
char EscapeChar(const char c) {
  switch (c) {
    case '\n':
      return 'n';
    case '\r':
      return 'r';
    default:
      return c;
  }
}
209 | ||
210 | std::string EscapeOptionString(const std::string& raw_string) { | |
211 | std::string output; | |
212 | for (auto c : raw_string) { | |
213 | if (isSpecialChar(c)) { | |
214 | output += '\\'; | |
215 | output += EscapeChar(c); | |
216 | } else { | |
217 | output += c; | |
218 | } | |
219 | } | |
220 | ||
221 | return output; | |
222 | } | |
223 | ||
224 | std::string UnescapeOptionString(const std::string& escaped_string) { | |
225 | bool escaped = false; | |
226 | std::string output; | |
227 | ||
228 | for (auto c : escaped_string) { | |
229 | if (escaped) { | |
230 | output += UnescapeChar(c); | |
231 | escaped = false; | |
232 | } else { | |
233 | if (c == '\\') { | |
234 | escaped = true; | |
235 | continue; | |
236 | } | |
237 | output += c; | |
238 | } | |
239 | } | |
240 | return output; | |
241 | } | |
242 | ||
// Returns a copy of `str` with leading and trailing whitespace (as
// classified by isspace) removed. A string that is empty or consists only of
// whitespace yields an empty string.
std::string trim(const std::string& str) {
  // isspace has undefined behavior for negative values other than EOF, so
  // the char must be converted to unsigned char first.
  const auto is_space = [](char ch) {
    return isspace(static_cast<unsigned char>(ch)) != 0;
  };

  // [start, end) is the range that is kept.
  size_t start = 0;
  size_t end = str.size();
  while (start < end && is_space(str[start])) {
    ++start;
  }
  while (end > start && is_space(str[end - 1])) {
    --end;
  }
  return str.substr(start, end - start);
}
258 | ||
259 | #ifndef ROCKSDB_LITE | |
260 | ||
// Converts "true"/"1" to true and "false"/"0" to false. Any other `value`
// raises std::invalid_argument whose message is `type`.
bool ParseBoolean(const std::string& type, const std::string& value) {
  const bool is_true = (value == "true" || value == "1");
  const bool is_false = (value == "false" || value == "0");
  if (!is_true && !is_false) {
    throw std::invalid_argument(type);
  }
  return is_true;
}
269 | ||
270 | uint32_t ParseUint32(const std::string& value) { | |
271 | uint64_t num = ParseUint64(value); | |
272 | if ((num >> 32LL) == 0) { | |
273 | return static_cast<uint32_t>(num); | |
274 | } else { | |
275 | throw std::out_of_range(value); | |
276 | } | |
277 | } | |
278 | ||
279 | #endif | |
280 | ||
// Parses an unsigned integer from the start of `value`. If the character
// right after the number is k/K, m/M, g/G or t/T, the result is multiplied
// by 2^10, 2^20, 2^30 or 2^40 respectively; any other trailing text is
// ignored.
//
// In the default build the number is parsed by std::stoull (base 10), which
// throws std::invalid_argument / std::out_of_range on bad input. In the
// CYGWIN build it is parsed with strtoull and base 0, with no error
// reporting. In both builds the suffix shift is not checked for overflow.
uint64_t ParseUint64(const std::string& value) {
  size_t endchar;
#ifndef CYGWIN
  uint64_t num = std::stoull(value, &endchar);
#else
  char* endptr;
  // strtoull (rather than strtoul) so the full 64-bit range is parsed even
  // where unsigned long is only 32 bits wide.
  uint64_t num = strtoull(value.c_str(), &endptr, 0);
  endchar = endptr - value.c_str();
#endif

  if (endchar < value.length()) {
    switch (value[endchar]) {
      case 'k':
      case 'K':
        num <<= 10LL;
        break;
      case 'm':
      case 'M':
        num <<= 20LL;
        break;
      case 'g':
      case 'G':
        num <<= 30LL;
        break;
      case 't':
      case 'T':
        num <<= 40LL;
        break;
      default:
        break;
    }
  }

  return num;
}
305 | ||
// Parses a signed integer from the start of `value`. If the character right
// after the number is k/K, m/M or g/G, the result is multiplied by 2^10,
// 2^20 or 2^30 respectively; any other trailing text is ignored.
//
// In the default build the number is parsed by std::stoi (base 10), which
// throws std::invalid_argument / std::out_of_range on bad input. In the
// CYGWIN build it is parsed with strtol and base 0, with no error reporting.
// In both builds the suffix scaling is not checked for overflow.
int ParseInt(const std::string& value) {
  size_t endchar;
#ifndef CYGWIN
  int num = std::stoi(value, &endchar);
#else
  char* endptr;
  // The value is signed, so parse it with the signed conversion.
  int num = static_cast<int>(std::strtol(value.c_str(), &endptr, 0));
  endchar = endptr - value.c_str();
#endif

  if (endchar < value.length()) {
    int shift = 0;
    switch (value[endchar]) {
      case 'k':
      case 'K':
        shift = 10;
        break;
      case 'm':
      case 'M':
        shift = 20;
        break;
      case 'g':
      case 'G':
        shift = 30;
        break;
      default:
        break;
    }
    // Shift in unsigned arithmetic: left-shifting a negative int, or shifting
    // a bit past the sign bit, is undefined behavior for signed operands.
    num = static_cast<int>(static_cast<unsigned int>(num) << shift);
  }

  return num;
}
328 | ||
// Parses a floating point number from the start of `value`. The default
// build uses std::stod; the CYGWIN build uses std::strtod instead.
double ParseDouble(const std::string& value) {
#ifdef CYGWIN
  return std::strtod(value.c_str(), nullptr);
#else
  return std::stod(value);
#endif
}
336 | ||
337 | size_t ParseSizeT(const std::string& value) { | |
338 | return static_cast<size_t>(ParseUint64(value)); | |
339 | } | |
340 | ||
341 | std::vector<int> ParseVectorInt(const std::string& value) { | |
342 | std::vector<int> result; | |
343 | size_t start = 0; | |
344 | while (start < value.size()) { | |
345 | size_t end = value.find(':', start); | |
346 | if (end == std::string::npos) { | |
347 | result.push_back(ParseInt(value.substr(start))); | |
348 | break; | |
349 | } else { | |
350 | result.push_back(ParseInt(value.substr(start, end - start))); | |
351 | start = end + 1; | |
352 | } | |
353 | } | |
354 | return result; | |
355 | } | |
356 | ||
357 | bool SerializeIntVector(const std::vector<int>& vec, std::string* value) { | |
358 | *value = ""; | |
359 | for (size_t i = 0; i < vec.size(); ++i) { | |
360 | if (i > 0) { | |
361 | *value += ":"; | |
362 | } | |
363 | *value += ToString(vec[i]); | |
364 | } | |
365 | return true; | |
366 | } | |
367 | ||
368 | } // namespace rocksdb |