From 648d871ab448b81dc714dcbdca955afd9a9bc3c3 Mon Sep 17 00:00:00 2001 From: albert-github Date: Mon, 23 Sep 2019 15:47:01 +0200 Subject: HTML attribute name An HTML attribute name can have e.g. an XML namespace in it and thus contain a colon (`:`) like: ``` Social Icons ``` but this results in ``` warning: found tag without matching ``` and garbled output. Allowing a colon in the attribute name solves this problem. --- src/doctokenizer.l | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/doctokenizer.l b/src/doctokenizer.l index 9786720..22b14a0 100644 --- a/src/doctokenizer.l +++ b/src/doctokenizer.l @@ -350,7 +350,7 @@ LISTITEM {BLANK}*[-]("#")?{WS} MLISTITEM {BLANK}*[+*]{WS} OLISTITEM {BLANK}*[1-9][0-9]*"."{BLANK} ENDLIST {BLANK}*"."{BLANK}*\n -ATTRNAME [a-z_A-Z\x80-\xFF][a-z_A-Z0-9\x80-\xFF\-]* +ATTRNAME [a-z_A-Z\x80-\xFF][:a-z_A-Z0-9\x80-\xFF\-]* ATTRIB {ATTRNAME}{WS}*("="{WS}*(("\""[^\"]*"\"")|("'"[^\']*"'")|[^ \t\r\n'"><]+))? URLCHAR [a-z_A-Z0-9\!\~\,\:\;\'\$\?\@\&\%\#\.\-\+\/\=] URLMASK ({URLCHAR}+([({]{URLCHAR}*[)}])?)+ -- cgit v0.12