From a9f50d33e5a32910a09035ea5927706c74be0d64 Mon Sep 17 00:00:00 2001
From: Karl Williamson
Date: Sun, 18 Aug 2013 08:50:34 -0600
Subject: [PATCH] utf8.h, unicode_constants.h: Add some #defines.

These will be used in a future commit
---
 regen/unicode_constants.pl | 3 +++
 unicode_constants.h | 3 +++
 utf8.h | 2 ++
 3 files changed, 8 insertions(+)

diff --git a/regen/unicode_constants.pl b/regen/unicode_constants.pl
index 78a7c96..bbd4497 100644
--- a/regen/unicode_constants.pl
+++ b/regen/unicode_constants.pl
@@ -155,6 +155,9 @@ U+03C5 string
 
 U+1E9E string
 
+U+FB05 string
+U+FB06 string
+
 U+2010 string
 U+D800 first FIRST_SURROGATE
 BOM first
diff --git a/unicode_constants.h b/unicode_constants.h
index 38b438a..4037950 100644
--- a/unicode_constants.h
+++ b/unicode_constants.h
@@ -35,6 +35,9 @@
 
 #define LATIN_CAPITAL_LETTER_SHARP_S_UTF8 "\xE1\xBA\x9E" /* U+1E9E */
 
+#define LATIN_SMALL_LIGATURE_LONG_S_T_UTF8 "\xEF\xAC\x85" /* U+FB05 */
+#define LATIN_SMALL_LIGATURE_ST_UTF8 "\xEF\xAC\x86" /* U+FB06 */
+
 #define HYPHEN_UTF8 "\xE2\x80\x90" /* U+2010 */
 #define FIRST_SURROGATE_UTF8_FIRST_BYTE 0xED /* U+D800 */
 #define BOM_UTF8_FIRST_BYTE 0xEF /* U+FEFF */
diff --git a/utf8.h b/utf8.h
index 1be5a12..7dcea6f 100644
--- a/utf8.h
+++ b/utf8.h
@@ -536,6 +536,8 @@ Perl's extended UTF-8 means we can have start bytes up to FF.
 #define LATIN_CAPITAL_LETTER_Y_WITH_DIAERESIS 0x0178 /* Also is title case */
 #define LATIN_CAPITAL_LETTER_SHARP_S 0x1E9E
 #define LATIN_SMALL_LETTER_LONG_S 0x017F
+#define LATIN_SMALL_LIGATURE_LONG_S_T 0xFB05
+#define LATIN_SMALL_LIGATURE_ST 0xFB06
 #define KELVIN_SIGN 0x212A
 #define ANGSTROM_SIGN 0x212B
 
-- 
2.7.4