2024-12-05 21:14:30 -05:00 · 2024-12-05 21:14:30 -05:00 · 1120beb52e
commit 1120beb52e
parent 4d8fea7f32
9 changed files with 3979 additions and 21 deletions
--- a/epan/ftypes/ftype-double.c
+++ b/epan/ftypes/ftype-double.c
@ -11,6 +11,7 @@
 #include <ftypes-int.h>
 #include <float.h>
 #include <wsutil/array.h>
+#include <wsutil/dtoa.h>

 static void
 double_fvalue_new(fvalue_t *fv)
@ -56,20 +57,26 @@ float_val_to_repr(wmem_allocator_t *scope, const fvalue_t *fv, ftrepr_t rtype, i
 {
 	char *buf = wmem_alloc(scope, G_ASCII_DTOSTR_BUF_SIZE);
 	if (rtype == FTREPR_DFILTER)
-		g_ascii_dtostr(buf, G_ASCII_DTOSTR_BUF_SIZE, fv->value.floating);
+		dtoa_g_fmt(buf, fv->value.floating);
 	else
-		g_ascii_formatd(buf, G_ASCII_DTOSTR_BUF_SIZE, "%." G_STRINGIFY(FLT_DIG) "g", fv->value.floating);
+		g_ascii_formatd(buf, G_ASCII_DTOSTR_BUF_SIZE, "%." G_STRINGIFY(FLT_DECIMAL_DIG) "g", fv->value.floating);
 	return buf;
 }

 static char *
-double_val_to_repr(wmem_allocator_t *scope, const fvalue_t *fv, ftrepr_t rtype, int field_display _U_)
+double_val_to_repr(wmem_allocator_t *scope, const fvalue_t *fv, ftrepr_t rtype _U_, int field_display _U_)
 {
+	/* XXX - We prefer the g fmt here because it's always exact enough for
+	 * serialization and equality testing. We could also use dtoa to write
+	 * a BASE_EXP format that is acceptable for serialization and testing.
+	 * We could output hex floating point if field_display is BASE_HEX, as
+	 * it's always exact too, but it is less widely supported (JSON, XML,
+	 * and others don't handle it). BASE_DEC is just always a bad idea for
+	 * equality testing and serialization, unless you want to allow for
+	 * strings up to 308 characters.
+	 */
 	char *buf = wmem_alloc(scope, G_ASCII_DTOSTR_BUF_SIZE);
-	if (rtype == FTREPR_DFILTER)
-		g_ascii_dtostr(buf, G_ASCII_DTOSTR_BUF_SIZE, fv->value.floating);
-	else
-		g_ascii_formatd(buf, G_ASCII_DTOSTR_BUF_SIZE, "%." G_STRINGIFY(DBL_DIG) "g", fv->value.floating);
+	dtoa_g_fmt(buf, fv->value.floating);
 	return buf;
 }

--- a/epan/proto.c
+++ b/epan/proto.c
@ -31,6 +31,7 @@
 #include <wsutil/wslog.h>
 #include <wsutil/ws_assert.h>
 #include <wsutil/unicode-utils.h>
+#include <wsutil/dtoa.h>

 #include <ftypes/ftypes.h>

@ -10689,7 +10690,6 @@ static size_t
 fill_display_label_float(const field_info *fi, char *label_str)
 {
 	int display;
-	int digits;
 	int n;
 	double value;

@ -10705,12 +10705,11 @@ fill_display_label_float(const field_info *fi, char *label_str)

 	switch (display) {
 		case BASE_NONE:
-			if (fi->hfinfo->type == FT_FLOAT)
-				digits = FLT_DIG;
-			else
-				digits = DBL_DIG;
-
-			n = snprintf(label_str, ITEM_LABEL_LENGTH, "%.*g", digits, value);
+			if (fi->hfinfo->type == FT_FLOAT) {
+				n = snprintf(label_str, ITEM_LABEL_LENGTH, "%.*g", FLT_DIG, value);
+			} else {
+				n = (int)strlen(dtoa_g_fmt(label_str, value));
+			}
 			break;
 		case BASE_DEC:
 			n = snprintf(label_str, ITEM_LABEL_LENGTH, "%f", value);
--- a/resources/Acknowledgements.md
+++ b/resources/Acknowledgements.md
@ -23,3 +23,5 @@ We use the overflow-safe math functions from the [portable snippets](https://git
 We use the [Lrexlib](https://github.com/rrthomas/lrexlib) Lua library, specifically the PCRE2 flavour, to provide a regular expression API for Lua.

 The code for our `strptime()` implementation is from [NetBSD](https://www.netbsd.org/).
+
+We use the [dtoa](https://www.netlib.org/fp/) implementation written by David M. Gay.
--- a/test/suite_dissectors/group_asterix.py
+++ b/test/suite_dissectors/group_asterix.py
@ -696,7 +696,7 @@ class TestCategory019:
            [0x01, 0x80, 0x7f, 0xff, 0xff, 0xff, 0x00, 0x00, 0x00, 0x00],
            "asterix.019_600",
            {
-                "asterix.019_600_LAT": "359.999999832362",
+                "asterix.019_600_LAT": "359.99999983236194",
                "asterix.019_600_LON": "0"
            }
        )
@ -713,7 +713,7 @@ class TestCategory019:
            "asterix.019_600",
            {
                "asterix.019_600_LAT": "0",
-                "asterix.019_600_LON": "359.999999832362"
+                "asterix.019_600_LON": "359.99999983236194"
            }
        )
        validator.add_dissection(
@ -1516,7 +1516,7 @@ class TestCategory048:
        validator.add_dissection(
            [0x10, 0x00, 0x00, 0xff, 0xff],
            "asterix.048_040",
-            dict_local(x_040, "048_040", "THETA", "359.994506835938")
+            dict_local(x_040, "048_040", "THETA", "359.9945068359375")
        )
        x_070 = {
            "asterix.048_070_V": "0",
@ -1766,7 +1766,7 @@ class TestCategory048:
        validator.add_dissection(
            [0x01, 0x04, 0x00, 0x00, 0xff, 0xff],
            "asterix.048_200",
-            dict_local(x_200, "048_200", "HDG", "359.994506835938")
+            dict_local(x_200, "048_200", "HDG", "359.9945068359375")
        )
        x_170 = {
            "asterix.048_170_CNF": "0",
@ -3393,7 +3393,7 @@ class TestCategory063:
            [0x01, 0x80, 0x7f, 0xff],
            "asterix.063_081",
            {
-                "asterix.063_081_VALUE": "179.994506835938"
+                "asterix.063_081_VALUE": "179.9945068359375"
            }
        )
        validator.add_dissection(
@ -3439,7 +3439,7 @@ class TestCategory063:
            [0x01, 0x20, 0x7f, 0xff],
            "asterix.063_091",
            {
-                "asterix.063_091_VALUE": "179.994506835938"
+                "asterix.063_091_VALUE": "179.9945068359375"
            }
        )
        validator.add_dissection(
@ -3453,7 +3453,7 @@ class TestCategory063:
            [0x01, 0x10, 0x7f, 0xff],
            "asterix.063_092",
            {
-                "asterix.063_092_VALUE": "179.994506835938"
+                "asterix.063_092_VALUE": "179.9945068359375"
            }
        )
        validator.add_dissection(
--- a/tools/checklicenses.py
+++ b/tools/checklicenses.py
@ -133,6 +133,12 @@ PATH_SPECIFIC_ALLOWED_LICENSES = {
    '.gitlab/': [
        'UNKNOWN',
    ],
+    'wsutil/dtoa.c': [
+        'dtoa',
+    ],
+    'wsutil/dtoa.h': [
+        'dtoa',
+    ],
    'wsutil/safe-math.h': [ # Public domain (CC0)
        'UNKNOWN',
    ],
--- a/tools/licensecheck.pl
+++ b/tools/licensecheck.pl
@ -713,6 +713,10 @@ sub parselicense {
 			$license = 'ISC';
 		}

+		if ($licensetext =~ /SPDX-License-Identifier:\s+dtoa/i) {
+			$license = 'dtoa';
+		}
+
 		if ($licensetext =~ /(?:is|may be)\s(?:(?:distributed|used).*?terms|being\s+released).*?\b(L?GPL)\b/) {
 			my $v = $gplver || ' (unversioned/unknown version)';
 			$license = "$1$v $license";
@ -740,6 +744,10 @@ sub parselicense {
 			$license = "ISC $license";
 		}

+                if ($licensetext =~ /Permission to use, copy, modify, and distribute this software for any purpose without fee is hereby granted, provided that this entire notice is included in all copies of any software which is or includes a copy or modification of this software and in all copies of the supporting documentation for such software./) {
+			$license = "dtoa $license";
+                }
+
 		if ($licensetext =~ /THIS SOFTWARE IS PROVIDED .*AS IS AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY/) {
 			if ($licensetext =~ /All advertising materials mentioning features or use of this software must display the following acknowledge?ment.*This product includes software developed by/i) {
 					$license = "BSD (4 clause) $license";
--- a/wsutil/CMakeLists.txt
+++ b/wsutil/CMakeLists.txt
@ -178,6 +178,7 @@ set(WSUTIL_COMMON_FILES
 	crc11.c
 	curve25519.c
 	dot11decrypt_wep.c
+	dtoa.c
 	eax.c
 	failure_message_simple.c
 	feature_list.c
--- a/wsutil/dtoa.c
+++ b/wsutil/dtoa.c
--- a/wsutil/dtoa.h
+++ b/wsutil/dtoa.h
@ -0,0 +1,46 @@
+/** @file
+ * David M. Gay dtoa (double to ASCII string) implementation header file
+ *
+ * Wireshark - Network traffic analyzer
+ * By Gerald Combs <gerald@wireshark.org>
+ * Copyright 1998 Gerald Combs
+ *
+ * SPDX-License-Identifier: dtoa
+ */
+
+#pragma once
+
+#include <wireshark.h>
+
+#ifdef __cplusplus
+extern "C" {
+#endif /* __cplusplus */
+
+/* Stores the closest decimal approximation to value in buf;
+ * it suffices to declare buf
+ *      char buf[32];
+ *
+ * Specifically, this finds the shortest possible string that when converted
+ * back to a double will be equal to the original value. There is no single
+ * value that can be passed to snprintf("%.*g") that will work for all cases.
+ *
+ * E.g., for the IEEE 754 double closest to 1/7th (0x1.2492492492492p-3), 17
+ * (DBL_DECIMAL_DIG) digits are required; neither "0.1428571428571428" nor
+ * "0.1428571428571429" suffices, converting to 0x1.249249249249p-3 and
+ * 0x1.2492492492494p-3, respectively. However, for the double closest to
+ * 0.2 (0x1.999999999999ap-3), the closest string with 17 significant digits
+ * is "0.20000000000000001", not "0.2", even though both convert *to* the
+ * same double and would test as equal. So DBL_DECIMAL_DIG is *sufficient*
+ * for serialization but not necessary in all cases, and the result can look
+ * noticeably worse in formats where trailing zeros are removed.
+ *
+ * Note that C++17's std::to_chars produces the same result, though the
+ * difficulty of implementing it made it one of the last features to become
+ * widely supported across C++ standard libraries. It is not part of the
+ * C standard library.
+ */
+WS_DLL_PUBLIC char *dtoa_g_fmt(char *buf, double value);
+
+#ifdef __cplusplus
+}
+#endif /* __cplusplus */