diff options
Diffstat (limited to '')
-rw-r--r-- | wsutil/utf8_entities.h | 75 |
1 files changed, 75 insertions, 0 deletions
diff --git a/wsutil/utf8_entities.h b/wsutil/utf8_entities.h new file mode 100644 index 00000000..3d2f2533 --- /dev/null +++ b/wsutil/utf8_entities.h @@ -0,0 +1,75 @@ +/** @file + * + * Byte sequences for various UTF-8 entities + * + * Wireshark - Network traffic analyzer + * By Gerald Combs <gerald@wireshark.org> + * Copyright 1998 Gerald Combs + * + * SPDX-License-Identifier: GPL-2.0-or-later + */ + + +#ifndef __UTF8_ENTITIES_H__ +#define __UTF8_ENTITIES_H__ + +/* + * Sequences can be found at + * http://www.fileformat.info/info/unicode/ + * http://www.utf8-chartable.de/ + * and other places + * + * Please be conservative when adding code points below. While many modern + * systems default to UTF-8 and handle it well, some do not. The Windows + * console is a notable example. As a general rule you probably shouldn't + * stray too far from code page 437 or WGL4: + * https://en.wikipedia.org/wiki/Code_page_437 + * https://en.wikipedia.org/wiki/Windows_Glyph_List_4 + * + * Hopefully we can dispense with the sequences below and simply encode our + * files as UTF 8 at some point. For example gcc has supported UTF 8 since + * at least 3.4. Visual C++ on the other hand is much more problematic. + * 2015 and later support /source-charset:utf-8, but prior versions appear + * to require a UTF 8 BOM. + */ + +#define UTF8_DEGREE_SIGN "\xc2\xb0" /* 176 / 0xb0 */ +#define UTF8_SUPERSCRIPT_TWO "\xc2\xb2" /* 178 / 0xb2 */ +#define UTF8_MICRO_SIGN "\xc2\xb5" /* 181 / 0xb5 */ +#define UTF8_MIDDLE_DOT "\xc2\xb7" /* 183 / 0xb7 */ +#define UTF8_RIGHT_POINTING_DOUBLE_ANGLE_QUOTATION_MARK "\xc2\xbb" /* 187 / 0xbb */ + +#define UTF8_BULLET "\xe2\x80\xa2" /* 8226 / 0x2024 */ +#define UTF8_EM_DASH "\xe2\x80\x94" /* 8212 / 0x2014 */ +#define UTF8_HORIZONTAL_ELLIPSIS "\xe2\x80\xa6" /* 8230 / 0x2026 */ + +#define UTF8_LEFTWARDS_ARROW "\xe2\x86\x90" /* 8592 / 0x2190 */ +#define UTF8_RIGHTWARDS_ARROW "\xe2\x86\x92" /* 8594 / 0x2192 */ +#define UTF8_LEFT_RIGHT_ARROW "\xe2\x86\x94" /* 8596 / 0x2194 */ + +/* macOS command key */ +#define UTF8_PLACE_OF_INTEREST_SIGN "\xe2\x8c\x98" /* 8984 / 0x2318 */ + +#define UTF8_SYMBOL_FOR_NULL "\xe2\x90\x80" /* 9216 / 0x2400 */ + +#define UTF8_CHECK_MARK "\xe2\x9c\x93" /* 10003 / 0x2713 */ +#define UTF8_BALLOT_X "\xe2\x9c\x97" /* 10007 / 0x2717 */ +#define UTF8_LONG_RIGHTWARDS_ARROW "\xe2\x9f\xb6" /* 10230 / 0x27f6 */ + +#define UTF8_ZERO_WIDTH_NO_BREAK_SPACE "\xef\xbb\xbf" /* 65279 / 0xffef */ +#define UTF8_BOM UTF8_ZERO_WIDTH_NO_BREAK_SPACE + +#endif /* __UTF8_ENTITIES_H__ */ + +/* + * Editor modelines + * + * Local Variables: + * c-basic-offset: 4 + * tab-width: 8 + * indent-tabs-mode: nil + * End: + * + * ex: set shiftwidth=4 tabstop=8 expandtab + * :indentSize=4:tabSize=8:noTabs=true: + */ |