File tree Expand file tree Collapse file tree 2 files changed +2
-2
lines changed Expand file tree Collapse file tree 2 files changed +2
-2
lines changed Original file line number Diff line number Diff line change 10
10
asciiLettersBytes = [str (item ) for item in asciiLetters ]
11
11
asciiUppercaseBytes = [str (item ) for item in asciiUppercase ]
12
12
13
- invalid_unicode_re = re .compile (u"[\u0001 -\u0008 \u000B \u000E -\u001F \u007F -\u009F \uD800 -\uDFFF \uFDD0 -\uFDDF \uFFFE \uFFFF \U0001FFFE \U0001FFFF \U0002FFFE \U0002FFFF \U0003FFFE \U0003FFFF \U0004FFFE \U0004FFFF \U0005FFFE \U0005FFFF \U0006FFFE \U0006FFFF \U0007FFFE \U0007FFFF \U0008FFFE \U0008FFFF \U0009FFFE \U0009FFFF \U000AFFFE \U000AFFFF \U000BFFFE \U000BFFFF \U000CFFFE \U000CFFFF \U000DFFFE \U000DFFFF \U000EFFFE \U000EFFFF \U000FFFFE \U000FFFFF \U0010FFFE \U0010FFFF ]" )
13
+ invalid_unicode_re = re .compile (u"[\u0001 -\u0008 \u000B \u000E -\u001F \u007F -\u009F \uD800 -\uDFFF \uFDD0 -\uFDEF \uFFFE \uFFFF \U0001FFFE \U0001FFFF \U0002FFFE \U0002FFFF \U0003FFFE \U0003FFFF \U0004FFFE \U0004FFFF \U0005FFFE \U0005FFFF \U0006FFFE \U0006FFFF \U0007FFFE \U0007FFFF \U0008FFFE \U0008FFFF \U0009FFFE \U0009FFFF \U000AFFFE \U000AFFFF \U000BFFFE \U000BFFFF \U000CFFFE \U000CFFFF \U000DFFFE \U000DFFFF \U000EFFFE \U000EFFFF \U000FFFFE \U000FFFFF \U0010FFFE \U0010FFFF ]" )
14
14
15
15
ascii_punctuation_re = re .compile (ur"[\u0009-\u000D\u0020-\u002F\u003A-\u0040\u005B-\u0060\u007B-\u007E]" )
16
16
Original file line number Diff line number Diff line change @@ -178,7 +178,7 @@ def consumeNumberEntity(self, isHex):
178
178
# Certain characters get replaced with U+FFFD
179
179
if ((charAsInt <= 0x0008 ) or (charAsInt == 0x000B ) or (0x000E <= charAsInt <= 0x001F )
180
180
or (0x007F <= charAsInt <= 0x009F )
181
- or (0xD800 <= charAsInt <= 0xDFFF ) or (0xFDD0 <= charAsInt <= 0xFDDF )
181
+ or (0xD800 <= charAsInt <= 0xDFFF ) or (0xFDD0 <= charAsInt <= 0xFDEF )
182
182
or (charAsInt & 0xFFFE == 0xFFFE ) # catch all U+?FFFE and U+?FFFF, where ? is the plane number, 0x0..0x10 (hexadecimal)
183
183
or (0x10FFFF < charAsInt )):
184
184
char = u"\uFFFD "
You can’t perform that action at this time.
0 commit comments