// Protocol Buffers - Google's data interchange format // Copyright 2023 Google LLC. All rights reserved. // https://developers.google.com/protocol-buffers/ // // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are // met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // * Redistributions in binary form must reproduce the above // copyright notice, this list of conditions and the following disclaimer // in the documentation and/or other materials provided with the // distribution. // * Neither the name of Google LLC nor the names of its // contributors may be used to endorse or promote products derived from // this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include "upb/lex/strtod.h" #include #include // Must be last. #include "upb/port/def.inc" // Determine the locale-specific radix character by calling sprintf() to print // the number 1.5, then stripping off the digits. As far as I can tell, this // is the only portable, thread-safe way to get the C library to divulge the // locale's radix character. No, localeconv() is NOT thread-safe. static int GetLocaleRadix(char *data, size_t capacity) { char temp[16]; const int size = snprintf(temp, sizeof(temp), "%.1f", 1.5); UPB_ASSERT(temp[0] == '1'); UPB_ASSERT(temp[size - 1] == '5'); UPB_ASSERT(size < capacity); temp[size - 1] = '\0'; strcpy(data, temp + 1); return size - 2; } // Populates a string identical to *input except that the character pointed to // by pos (which should be '.') is replaced with the locale-specific radix. static void LocalizeRadix(const char *input, const char *pos, char *output) { const int len1 = pos - input; char radix[8]; const int len2 = GetLocaleRadix(radix, sizeof(radix)); memcpy(output, input, len1); memcpy(output + len1, radix, len2); strcpy(output + len1 + len2, input + len1 + 1); } double _upb_NoLocaleStrtod(const char *str, char **endptr) { // We cannot simply set the locale to "C" temporarily with setlocale() // as this is not thread-safe. Instead, we try to parse in the current // locale first. If parsing stops at a '.' character, then this is a // pretty good hint that we're actually in some other locale in which // '.' is not the radix character. char *temp_endptr; double result = strtod(str, &temp_endptr); if (endptr != NULL) *endptr = temp_endptr; if (*temp_endptr != '.') return result; // Parsing halted on a '.'. Perhaps we're in a different locale? Let's // try to replace the '.' with a locale-specific radix character and // try again. char localized[80]; LocalizeRadix(str, temp_endptr, localized); char *localized_endptr; result = strtod(localized, &localized_endptr); if ((localized_endptr - &localized[0]) > (temp_endptr - str)) { // This attempt got further, so replacing the decimal must have helped. // Update endptr to point at the right location. if (endptr != NULL) { // size_diff is non-zero if the localized radix has multiple bytes. int size_diff = strlen(localized) - strlen(str); *endptr = (char *)str + (localized_endptr - &localized[0] - size_diff); } } return result; }