diff options
author | Ezio Melotti <ezio.melotti@gmail.com> | 2022-06-21 20:03:12 (GMT) |
---|---|---|
committer | GitHub <noreply@github.com> | 2022-06-21 20:03:12 (GMT) |
commit | f28ec34c5c69f45dc0db8bc26df69bc7defe9c9d (patch) | |
tree | 05991a453bb4bda4aa6e2f9f54ed9fe8b58d2333 /Lib/html | |
parent | 4e08fbcfdfa57ea94091aabdd09413708e3fb2bf (diff) | |
download | cpython-f28ec34c5c69f45dc0db8bc26df69bc7defe9c9d.zip cpython-f28ec34c5c69f45dc0db8bc26df69bc7defe9c9d.tar.gz cpython-f28ec34c5c69f45dc0db8bc26df69bc7defe9c9d.tar.bz2 |
gh-82927: Update files related to HTML entities. (GH-92504)
Diffstat (limited to 'Lib/html')
-rw-r--r-- | Lib/html/entities.py | 9 |
1 file changed, 6 insertions, 3 deletions
```diff
diff --git a/Lib/html/entities.py b/Lib/html/entities.py
index dc50863..cc59bc3 100644
--- a/Lib/html/entities.py
+++ b/Lib/html/entities.py
@@ -3,8 +3,7 @@
 __all__ = ['html5', 'name2codepoint', 'codepoint2name', 'entitydefs']
 
 
-# maps the HTML entity name to the Unicode code point
-# from https://html.spec.whatwg.org/multipage/named-characters.html
+# maps HTML4 entity name to the Unicode code point
 name2codepoint = {
     'AElig': 0x00c6, # latin capital letter AE = latin capital ligature AE, U+00C6 ISOlat1
     'Aacute': 0x00c1, # latin capital letter A with acute, U+00C1 ISOlat1
@@ -261,7 +260,11 @@ name2codepoint = {
 }
 
 
-# maps the HTML5 named character references to the equivalent Unicode character(s)
+# HTML5 named character references
+# Generated by 'Tools/scripts/parse_html5_entities.py'
+# from https://html.spec.whatwg.org/entities.json and
+# https://html.spec.whatwg.org/multipage/named-characters.html.
+# Map HTML5 named character references to the equivalent Unicode character(s).
 html5 = {
     'Aacute': '\xc1',
     'aacute': '\xe1',
```