summary | refs | log | tree | commit | diff | stats
path: root/Lib/html
diff options
context:
space:
mode:
author: Ezio Melotti <ezio.melotti@gmail.com> 2022-06-21 20:03:12 (GMT)
committer: GitHub <noreply@github.com> 2022-06-21 20:03:12 (GMT)
commit: f28ec34c5c69f45dc0db8bc26df69bc7defe9c9d (patch)
tree: 05991a453bb4bda4aa6e2f9f54ed9fe8b58d2333 /Lib/html
parent: 4e08fbcfdfa57ea94091aabdd09413708e3fb2bf (diff)
download: cpython-f28ec34c5c69f45dc0db8bc26df69bc7defe9c9d.zip
cpython-f28ec34c5c69f45dc0db8bc26df69bc7defe9c9d.tar.gz
cpython-f28ec34c5c69f45dc0db8bc26df69bc7defe9c9d.tar.bz2
gh-82927: Update files related to HTML entities. (GH-92504)
Diffstat (limited to 'Lib/html')
-rw-r--r-- Lib/html/entities.py 9
1 files changed, 6 insertions, 3 deletions
diff --git a/Lib/html/entities.py b/Lib/html/entities.py
index dc50863..cc59bc3 100644
--- a/Lib/html/entities.py
+++ b/Lib/html/entities.py
@@ -3,8 +3,7 @@
__all__ = ['html5', 'name2codepoint', 'codepoint2name', 'entitydefs']
-# maps the HTML entity name to the Unicode code point
-# from https://html.spec.whatwg.org/multipage/named-characters.html
+# maps HTML4 entity name to the Unicode code point
name2codepoint = {
'AElig': 0x00c6, # latin capital letter AE = latin capital ligature AE, U+00C6 ISOlat1
'Aacute': 0x00c1, # latin capital letter A with acute, U+00C1 ISOlat1
@@ -261,7 +260,11 @@ name2codepoint = {
}
-# maps the HTML5 named character references to the equivalent Unicode character(s)
+# HTML5 named character references
+# Generated by 'Tools/scripts/parse_html5_entities.py'
+# from https://html.spec.whatwg.org/entities.json and
+# https://html.spec.whatwg.org/multipage/named-characters.html.
+# Map HTML5 named character references to the equivalent Unicode character(s).
html5 = {
'Aacute': '\xc1',
'aacute': '\xe1',