[Bug 9207] Anything else: This part of the spec is problematic, for example, a query string variable &lang_id=1 as part of an attribute of say an img tag, will get converted into a character token when it shouldn't be. Why is the set of characters a-z, A-Z, 0-

http://www.w3.org/Bugs/Public/show_bug.cgi?id=9207





--- Comment #6 from Simon Pieters <simonp@opera.com>  2010-03-29 09:06:24 ---
If anyone wants to look at the individual cases, I modified the script in
http://simon.html5.org/dump/entities-in-attribute-with-no-semicolon-or-alphanumeric.xml
as follows to show only '/':

<script><![CDATA[
onload=function(){
  var pre = document.getElementsByTagName('pre')[1];
  var lines = pre.textContent.split('\n');
  var data = [];
  var chars = {};
  var tmp;
  var tmp2;
  for (var i = 0; i < lines.length; ++i) {
    tmp = /^([^\t]+)\t(.+)$/.exec(lines[i]);
    tmp2 =
/&(AElig|AMP|Aacute|Acirc|Agrave|Aring|Atilde|Auml|COPY|Ccedil|ETH|Eacute|Ecirc|Egrave|Euml|GT|Iacute|Icirc|Igrave|Iuml|LT|Ntilde|Oacute|Ocirc|Ograve|Oslash|Otilde|Ouml|QUOT|REG|THORN|Uacute|Ucirc|Ugrave|Uuml|Yacute|aacute|acirc|acute|aelig|agrave|amp|aring|atilde|auml|brvbar|ccedil|cedil|cent|copy|curren|deg|divide|eacute|ecirc|egrave|eth|euml|frac12|frac14|frac34|gt|iacute|iuml|laquo|lt|macr|micro|middot|nbsp|not|ntilde|oacute|ocirc|ograve|ordf|ordm|oslash|otilde|ouml|para|plusmn|pound|quot|raquo|reg|sect|shy|sup1|sup2|sup3|szlig|thorn|times|uacute|ucirc|ugrave|uml|uuml|yacute|yen|yuml)([^;a-zA-Z0-9])/.exec(tmp[2]);
    for (var j = 2; j < tmp2.length; ++j) {

      // CHANGE HERE:
      if (tmp2[j] == '/')
        data.push([tmp[1], tmp[2]]);
    }
  }
  for (i = 0; i < data.length; ++i) {
    document.getElementsByTagName('pre')[0].textContent += data[i][1] + '\n\n';
  }
}
]]></script>


-- 
Configure bugmail: http://www.w3.org/Bugs/Public/userprefs.cgi?tab=email
------- You are receiving this mail because: -------
You are the QA contact for the bug.

Received on Monday, 29 March 2010 09:06:26 UTC