- From: CVS User fsasaki <cvsmail@w3.org>
- Date: Thu, 30 May 2013 07:53:26 +0000
- To: public-multilingualweb-lt-commits@w3.org
Update of /w3ccvs/WWW/International/multilingualweb/lt/drafts/its20 In directory gil:/tmp/cvs-serv23674 Modified Files: build.xml its20-for-editing-sec1-sec2.odd Added Files: its20-for-editing-sec1-sec2.html Log Message: updating build for sec 1-2 editing and making a few edits in sec 1 and 2 --- /w3ccvs/WWW/International/multilingualweb/lt/drafts/its20/build.xml 2013/05/20 09:25:59 1.19 +++ /w3ccvs/WWW/International/multilingualweb/lt/drafts/its20/build.xml 2013/05/30 07:53:26 1.20 @@ -39,21 +39,17 @@ <classpath refid="jing.classpath"/> </java> </target> - - <!-- - <target name="odd2xmlspec" depends="validateOdd"> - <java fork="true" classname="com.icl.saxon.StyleSheet"> - <classpath refid="saxon1-0.classpath"/> - <classpath refid="parse-html5.classpath"/> - <classpath refid="html5parser.classpath"/> - <arg value="-o"/> - <arg value="temp/its20-xmlspec.xml"/> - <arg value="its20.odd"/> - <arg value="tools/xslt/odd2xmlspec.xsl"/> + + <target name="validateOdd-sec1-sec2"> + <java fork="true" classname="com.thaiopensource.relaxng.util.Driver"> + <arg value="-c"/> + <arg value="tools/tei-w3c.rnc"/> + <arg value="its20-for-editing-sec1-sec2.odd"/> + <classpath refid="jing.classpath"/> </java> </target> - --> - <target name="odd2xmlspec" depends="validateOdd"> + + <target name="odd2xmlspec"> <java fork="true" classname="net.sf.saxon.Transform"> <classpath refid="saxon9.classpath"/> <arg value="-o:temp/its20-xmlspec.xml"/> @@ -61,8 +57,17 @@ <arg value="-xsl:tools/xslt/odd2xmlspec.xsl"/> </java> </target> + + <target name="odd2xmlspec-sec1-sec2"> + <java fork="true" classname="net.sf.saxon.Transform"> + <classpath refid="saxon9.classpath"/> + <arg value="-o:temp/its20-xmlspec.xml"/> + <arg value="-s:its20-for-editing-sec1-sec2.odd"/> + <arg value="-xsl:tools/xslt/odd2xmlspec.xsl"/> + </java> + </target> - <target name="makeXmlspecValid" depends="odd2xmlspec"> + <target name="makeXmlspecValid"> <java fork="true" classname="net.sf.saxon.Transform"> <classpath refid="saxon9.classpath"/> <arg value="-o:temp/its20-valid-xmlspec.xml"/> @@ -72,7 +77,7 @@ <xmlvalidate file="temp/its20-valid-xmlspec.xml"/> </target> - <target name="xmlspec2Html" depends="makeXmlspecValid"> + <target name="xmlspec2Html"> <replaceregexp file="temp/its20-valid-xmlspec.xml" match="<w3c-doctype>.*</w3c-doctype>" replace="<w3c-doctype>Editor's Copy</w3c-doctype>" flags="" encoding="utf-8"/> @@ -97,10 +102,17 @@ <arg value="temp/its20.html"/> <arg value="tools/xslt/makeedcopy.xsl"/> </java> + </target> + + <target name="copy2Edcopy"> <copy file="temp/temp.html" tofile="its20.html"/> </target> - <target name="xmlspec2TrHtml" depends="makeXmlspecValid"> + <target name="copy2Edcopy-sec1-sec2"> + <copy file="temp/temp.html" tofile="its20-for-editing-sec1-sec2.html"/> + </target> + + <target name="xmlspec2TrHtml"> <replaceregexp file="temp/its20-valid-xmlspec.xml" match="role="editors-copy"" replace="" encoding="utf-8"/> <replaceregexp file="temp/its20-valid-xmlspec.xml" match="w3c-doctype=".*"" @@ -219,9 +231,21 @@ </delete> </target> - <target name="all" depends="xmlspec2Html, xmlspec2TrHtml"/> + <target name="generate-ed-copy" depends="validateOdd, odd2xmlspec, makeXmlspecValid, xmlspec2Html, copy2Edcopy"> + <echo>GENERATION EDITORS COPY - DONE</echo> + </target> + + <target name="generate-tr-version" depends="validateOdd, odd2xmlspec, makeXmlspecValid, xmlspec2TrHtml"> + <echo>GENERATION TR VERSION - DONE</echo> + </target> + + <!-- Below target is temporary for editing sec 1 and sec 2, with its20-for-editing-sec1-sec2.odd as the ODD file. --> + + <target name="generate-sec1-2" depends="validateOdd-sec1-sec2, odd2xmlspec-sec1-sec2, makeXmlspecValid, xmlspec2Html, copy2Edcopy-sec1-sec2"> + <echo>GENERATION SEC1 - SEC2 VERSION - DONE</echo> + </target> - <target name="main" depends="xmlspec2Html"/> + <target name="main" depends="generate-ed-copy"/> <taskdef name="jing" classname="com.thaiopensource.relaxng.util.JingTask" classpathref="jing.classpath"/> @@ -242,22 +266,4 @@ <arg value="tools/xslt/disco-for-its20.xsl"/> </java> </target> - - <target name="testsuite-dashboard"> - <get src="https://github.com/finnle/ITS-2.0-Testsuite/archive/master.zip" - dest="temp/master.zip"/> - <unzip src="temp/master.zip" dest="temp"/> - <java fork="true" classname="net.sf.saxon.Transform"> - <classpath refid="saxon9.classpath"/> - <arg value="-o:temp/testsuiteMaster.xml"/> - <arg value="temp/TestSuiteCommitmentsFromGD.xml"/> - <arg value="temp/GD2testsuiteMaster.xsl"/> - </java> - <java fork="true" classname="net.sf.saxon.Transform"> - <classpath refid="saxon9.classpath"/> - <arg value="-o:temp/testSuiteDashboard.html"/> - <arg value="temp/testsuiteMaster.xml"/> - <arg value="tools/xslt/testsuiteDashboard.xsl"/> - </java> - </target> </project> --- /w3ccvs/WWW/International/multilingualweb/lt/drafts/its20/its20-for-editing-sec1-sec2.odd 2013/05/29 16:53:24 1.2 +++ /w3ccvs/WWW/International/multilingualweb/lt/drafts/its20/its20-for-editing-sec1-sec2.odd 2013/05/30 07:53:26 1.3 @@ -343,10 +343,10 @@ </p> - <egXML xmlns="http://www.tei-c.org/ns/Examples" target="examples/xml/EX-ways-to-use-its-0.xml" /> - </exemplum> - + + <note type="ed">Need to provide example: <![CDATA[ + <egXML xmlns="http://www.tei-c.org/ns/Examples" target="examples/xml/EX-ways-to-use-its-0.xml" />]]></note> <p> Like ITS 1.0, ITS 2.0 @@ -419,12 +419,121 @@ </div> - <div xml:id="general-motiviation-for-ITS2.0"><head>General motivation for going beyond ITS 1.0</head> <p>tbd</p></div> + <div xml:id="general-motiviation-for-ITS2.0"><head>General motivation for going beyond ITS 1.0</head> <note type="ed">We need to have the example <ref target="examples/xml/EX-motivation-its-2.xml">EX-motivation-its-2.xml</ref> here since it was part of resolving <ref target="https://www.w3.org/International/multilingualweb/lt/track/issues/100">issue-100</ref>.</note> + <exemplum xml:id="EX-motivation-its-1"> + <head>Document with partially translatable content</head> + <p>In this document it is difficult to distinguish between those <code>string</code> + elements that are translatable and those that are not. Only the addition of an + explicit flag could resolve the issue.</p> + <egXML xmlns="http://www.tei-c.org/ns/Examples" + target="examples/xml/EX-motivation-its-1.xml"/> + </exemplum> + <exemplum xml:id="EX-motivation-its-2"> + <head>Document with partially translatable content</head> + <p>Even when metadata are available to identify non-translatable text, the conditions + may be quite complex and not directly indicated with a simple flag. Here, for + instance, only the text in the nodes matching the expression + <code>//component[@type!='image']/data[@type='text']</code> is translatable.</p> + <egXML xmlns="http://www.tei-c.org/ns/Examples" + target="examples/xml/EX-motivation-its-2.xml"/> + </exemplum></div> <div xml:id="usage-scenarios"><head>Broader Usage Scenarios</head> <p>tbd</p></div> <div xml:id="high-level-differences-between-1.0-and-2.0"><head>High-level differences between ITS 1.0 and ITS 2.0</head> - + <div xml:id="specific-HTML-support"><head>Specific HTML support</head> + + <p>For applying ITS 2.0 data categories to HTML, four aspects must be considered:</p> + <list type="ordered"> + <item>referencing global rules</item> + <item>specifities of inserting local ITS 2.0 data categories</item> + <item>relationship between HTML markup and data categories, and</item> + <item>HTML version.</item> + </list> + <p>In the following sections these aspects are briefly discussed.</p> + <div xml:id="html5-reference-global-rules"><head>Referencing global rules</head> + <p>To account for the so-called “<ref target="#basic-concepts-selection-global">global + approach</ref>” in HTML, this specification (see <ptr target="#html5-global-rules" type="specref"/>) defines a link type for referring to external files + with global rules and an approach to have inline global rules in the HTML <code>script</code> element. + It is preferred to use external global rules linked via the <code>link</code> element than to have inline global rules in the HTML document.</p> + <exemplum xml:id="EX-translate-html5-global-1"> + <head>Using ITS global rules in HTML</head> + <p>The <code>link</code> element points to the rules file + <code>EX-translateRule-html5-1.xml</code> The <code>rel</code> attribute identifies + the ITS specific link relation <code>its-rules</code>.</p> + <egXML xmlns="http://www.tei-c.org/ns/Examples" + target="examples/html5/EX-translate-html5-global-1.html" type="html5"/> + </exemplum> + <exemplum xml:id="EX-translate-html5-global-1-rules-file"> + <head>ITS rules file linked from HTML</head> + <p>The rules file linked in <ptr target="#EX-translate-html5-global-1" type="exref" + />.</p> + <egXML xmlns="http://www.tei-c.org/ns/Examples" + target="examples/html5/EX-translateRule-html5-1.xml"/> + </exemplum> + </div> + <div xml:id="html5-its-local-markup"><head>Specifities of inserting local ITS 2.0 data categories</head> + <p>In HTML, an ITS 2.0 local data category is realized with the specific prefix <code>its-*</code>. + The general mapping of the XML based ITS 2.0 attributes to their HTML <code>its-*</code> counterparts is defined in + <ptr target="#html5-local-attributes" type="specref"/>. An informative table in <ptr target="#list-of-elements-and-attributes" type="specref"/> + provides an overview of the mapping for all data categories.</p> + </div> + <div xml:id="html5-existing-markup-versus-its"><head>Relation between HTML markup and ITS 2.0 data categories</head> + <p>There are four ITS 2.0 data categories, which have direct counterparts + in HTML markup. For theses data categories, ITS 2.0 defines the following specific + behaviour:</p> + <list type="unordered"> + <item>The <ref target="#language-information">Language Information</ref> data category has the HTML <code>lang</code> + attribute counterpart; in XHTML this is the <code>xml:lang</code> attribute. These attributes act as + local markup for the <ref target="#language-information">Language Information</ref> data category in HTML and + take <ref target="#selection-precedence">precedence</ref> over language information conveyed via a global <gi>langRule</gi>.</item> + <item>The <ref target="#idvalue">Id Value</ref> data category has the HTML or XHTML <code>id</code> attribute. + This attribute acts as local markup for the <ref target="#idvalue">Id Value</ref> data category in HTML and take <ref target="#selection-precedence">precedence</ref> over + id information conveyed via a global <gi>idValueRule</gi>.</item> + <item>The <ref target="#elements-within-text">Elements within Text</ref> data category has a set of HTML + elements defined as <ref target="http://www.w3.org/TR/html51/dom.html#phrasing-content-1">phrasing content</ref>. In the absence of an + <ref target="#elements-within-text">Elements within Text</ref> local attribute or global rules selecting the + element in question, these elements are always interpreted as + <code>withinText="yes"</code> by default, except for the elements <gi>iframe</gi>, <gi>noscript</gi>, <gi>script</gi> + and <gi>textarea</gi> which are interpreted as <code>withinText="nested"</code>.</item> + <item>The <ref target="#trans-datacat">Translate</ref> data category has a direct counterpart in + <ptr target="#html5" type="bibref"/>, namely the HTML5 + <code>translate</code> attribute. ITS 2.0 does not define its own behaviour for HTML5 <code>translate</code>, but just refers to <ref target="http://www.w3.org/TR/html51/dom.html#the-translate-attribute">the HTML5 definition</ref>.</item> + </list> + <exemplum xml:id="EX-its-and-existing-HTML5-markup"> + <head>The <ref target="#language-information">Language Information</ref>, <ref target="#idvalue">Id Value</ref>, + <ref target="#elements-within-text">Elements within Text</ref> and <ref target="#trans-datacat">Translate</ref> + ITS 2.0 data categories used with + HTML native markup.</head> + <p>The <code>html</code> element is interpreted to convey the + <ref target="#language-information">Language Information</ref> value <val>en</val>. + The <code>p</code> element is interpreted to + convey the <ref target="#idvalue">Id Value</ref> of <val>p1</val>. The <code>em</code> element + is interpreted to be <code>withinText="yes"</code>. The <code>img</code> element is set to be translatable via an <ptr target="#html5" type="bibref"/> <code>translate</code> attribute. Here the <code>alt</code> attribute will also be translatable.</p> + <egXML xmlns="http://www.tei-c.org/ns/Examples" + target="examples/html5/EX-its-and-existing-HTML5-markup.html"/> + </exemplum> + <p>There are also some HTML markup elements that have similar, but not always identical, roles and behaviour than certain ITS 2.0 data categories. + For example, the HTML <code>dfn</code> element + could be used to identify a term in the sense of the <ref target="#terminology">Terminology</ref> data + category. However, this is not always the case and it depends on the + intentions of the content author. To accomodate this situation, users + of ITS 2.0 are encouraged to specifiy the association of existing HTML + markup with a dedicated global rules file. For an example rules file see the + <ref target="http://www.w3.org/TR/2008/NOTE-xml-i18n-bp-20080213/#relating-its-plus-xhtml">XML I18N Best Practices</ref> document.</p> + </div> + <div xml:id="html5-standoff-markup-explanation"><head>Standoff Markup in HTML5</head> + <p>The <ref target="#provenance">Provenance</ref> and the <ref target="#lqissue">Localization Quality Issue</ref> data categories allow for using standoff markup. In HTML such standoff markup is put into a <code>script</code> element. The constraints for <ref target="#provenance-records-in-html5-constraint">Provenance standoff</ref> markup in HTML and <ref target="#loc-quality-issues-in-html5-constraint">Localization quality issue</ref> markup in HTML need to be taken into account. Examples of standoff markup in HTML for the two data categories are <ptr target="#EX-provenance-html5-local-2" type="exref"/> and <ptr target="#EX-locQualityIssue-html5-local-2" type="exref"/>.</p></div> + <div xml:id="usage-in-legacy-html"> + <head>Version of HTML</head> + <p>ITS 2.0 does not define how to use ITS in HTML versions prior version 5. Users are + encouraged to migrate their content to HTML5 or XHTML. While it is possible to use + <code>its-*</code> attributes introduced for <ptr target="#html5" type="bibref"/> in older versions of HTML (such + as 3.2 or 4.01) and pages using these attributes will work without any problems, + <code>its-*</code> attributes will be marked as invalid in validators.</p> + </div> + </div> + <!-- http://lists.w3.org/Archives/Public/public-multilingualweb-lt-comments/2013Jan/0018.html @@ -466,7 +575,9 @@ <div xml:id="additional-data-categories"><head>Additional data categories</head> <p>tbd</p></div> - <div xml:id="modified-datacategories"><head>Modified data categories</head> <p>tbd</p></div> + <div xml:id="modified-datacategories"><head>Modified data categories</head> <p>tbd</p> + + </div> <div xml:id="additional-mechanisms"><head>Additional or modified mechanisms</head> @@ -480,7 +591,7 @@ </div> - <div xml:id="specific-HTML-support"><head>Specific HTML support</head> <p>tbd</p></div> + <div xml:id="mappings"><head>Mappings</head> @@ -4442,9 +4553,9 @@ generation. In most Content Management Systems, content is divided into several fields, some of which may be restricted to plain text, while in other fields HTML fragments may be allowed. Enforcing such restrictions is outside the scope of this - data category. For further information see <ptr target="#content-producers" - type="specref"/>.</p> + data category.</p> </note> + <note type="ed">Removed reference to <ref target="http://www.w3.org/International/multilingualweb/lt/drafts/its20/its20.html#content-producers">content producers</ref> description in introduction here.</note> <p>The set of characters that are allowed is specified using a regular expression. That is, each character in the selected content <ref target="#rfc-keywords">MUST</ref> be included in the set specified by the regular expression.</p> @@ -5854,12 +5965,12 @@ see <ref target="https://www.w3.org/International/multilingualweb/lt/track/actions/493">action-493</ref>.</item> <item>Updated the definition of the regular expression to use in the <ptr type="specref" target="#allowedchars"/> data category, see <ref target="https://www.w3.org/International/multilingualweb/lt/track/issues/67">issue-67</ref>.</item> - <item>Updated <ptr target="#usage-in-html" type="specref"/> to reflect discussion on HTML defaults, see <ref target="https://www.w3.org/International/multilingualweb/lt/track/issues/89">issue-89</ref>, <ref target="https://www.w3.org/International/multilingualweb/lt/track/issues/97">issue-97</ref> and <ref target="https://www.w3.org/International/multilingualweb/lt/track/issues/118">issue-118</ref>.</item> + <item>Updated <ptr target="#specific-HTML-support" type="specref"/> to reflect discussion on HTML defaults, see <ref target="https://www.w3.org/International/multilingualweb/lt/track/issues/89">issue-89</ref>, <ref target="https://www.w3.org/International/multilingualweb/lt/track/issues/97">issue-97</ref> and <ref target="https://www.w3.org/International/multilingualweb/lt/track/issues/118">issue-118</ref>.</item> <item>Clarified <ref target="#provenance-records-in-html5-constraint">provenance</ref> and <ref target="#loc-quality-issues-in-html5-constraint">localization quality issue</ref> standoff constraints for HTML5, see related <ref target="http://lists.w3.org/Archives/Public/public-multilingualweb-lt/2013May/0032.html">mail thread</ref>.</item> <item>Edits related to HTML defaults for <ref target="#elements-within-text">Elements Within Text</ref> and <ref target="#language-information">Language Information</ref>, see <ref target="http://lists.w3.org/Archives/Public/public-multilingualweb-lt/2013May/0010.html">mail thread</ref> and <ref target="https://www.w3.org/International/multilingualweb/lt/track/issues/118">issue-118</ref>.</item> - <item>Added <ptr target="#its-and-xliff" type="specref"/>.</item> + <item>Added section about ITS and XLIFF to <ptr type="specref" target="#introduction"/>.</item> <item>Added a <ref target="#text-analyis-serializations">note on serializations</ref> of the <ref target="#textanalysis">Text Analysis</ref> data category.</item> <item>Added <ref target="#its-conformance-2-5">conformance clause 2-5</ref> about non ITS elements and attributes and a <ref target="#foreign-elements">related paragraph</ref> to <ptr target="#its-schemas" type="specref"/>, see <ref target="https://www.w3.org/International/multilingualweb/lt/track/actions/527">action-527</ref>.</item> <item>Made <att>annotatorsRef</att> only needed for <ref target="#terminology">Terminology</ref>, <ref target="#textanalysis">Text Analysis</ref> and <ref target="#mtconfidence">MT Confidence</ref>, see <ref target="https://www.w3.org/International/multilingualweb/lt/track/issues/71">issue-71</ref>.</item> @@ -6054,8 +6165,7 @@ <att>domainPointer</att> attribute in <ptr target="#EX-domain-2" type="exref"/> and <ref target="https://www.w3.org/International/multilingualweb/lt/track/actions/282" >action-282</ref>.</item> - <item>Defined <ref target="#directionality">Directionality</ref> and Ruby as non-normative features. See <ptr - target="#relation-to-its10" type="specref"/>, note on directionality and <ref + <item>Defined <ref target="#directionality">Directionality</ref> and Ruby as non-normative features. See note on directionality and <ref target="https://www.w3.org/International/multilingualweb/lt/track/actions/250" >action-250</ref>.</item> <item>Update on Disambiguation example <ptr @@ -6104,8 +6214,8 @@ analysis annotation requirement</ref> is covered by the local disambiguation attribute disambigConfidence, in conjunction with <ptr target="#its-tool-annotation" type="specref"/>.</item> - <item>Added explanations about ITS 2.0 and plain text in CMS to <ptr - target="#content-producers" type="specref"/> and <ptr + <item>Added explanations about ITS 2.0 and plain text in CMS to <q>content producers</q> + definition in introduction and <ptr target="#allowedchars-definition" type="specref"/> - see <ref target="https://www.w3.org/International/multilingualweb/lt/track/actions/262" >action-262</ref> and <ref @@ -6210,7 +6320,7 @@ >data category overview table</ref>.</p> </item> <item> - <p>Added new kind of user to <ptr target="#potential-users" type="specref"/>.</p> + <p>Added new kind of user to <ptr target="#introduction" type="specref"/>.</p> </item> <item> <p>Added the algorithm to obtain the value of the <ref target="#domain">Domain</ref> @@ -6256,12 +6366,11 @@ <list type="ordered"> <item>Various editorial changes (non-normative references update, style & grammar fixes).</item> - <item>Made clarifications to <ptr target="#out-of-scope" type="specref"/>, <ptr - type="specref" target="#design-decisions"/>.</item> + <item>Made clarifications to <q>out of scope</q> list and <q>design decisions</q>in <ptr target="#introduction" type="specref"/>.</item> <item>Added explanatory note on precedence and overriding in <ptr target="#selection-precedence" type="specref"/>.</item> <item>Reordered some components in <ptr type="specref" target="#introduction"/>.</item> - <item>Restructured <ptr target="#relation-to-its10-and-new-principles" type="specref" + <item>Restructured <q>relation to ITS 1.0 and new principles</q> in <ptr target="#introduction" type="specref" />.</item> <item>Added <ptr target="#queryLanguage" type="specref"/> as a stub.</item> <item>Added <ptr target="#LocaleFilter" type="specref"/>.</item> @@ -6279,7 +6388,7 @@ <list type="ordered"> <item>Clarified <ref target="#introduction">introduction</ref> to cover ITS 2.0</item> <item>Added a subsection on the relation to ITS 1.0 to the introduction, see <ptr - target="#relation-to-its10" type="specref"/></item> + target="#introduction" type="specref"/></item> <item>Created HTML based declarations for various data categories, see e.g. HTML declarations for the Terminology data category and the summary for local data categories in <ptr target="#selection-local" type="specref"/></item> --- /w3ccvs/WWW/International/multilingualweb/lt/drafts/its20/its20-for-editing-sec1-sec2.html 2013/05/30 07:53:26 NONE +++ /w3ccvs/WWW/International/multilingualweb/lt/drafts/its20/its20-for-editing-sec1-sec2.html 2013/05/30 07:53:26 1.1 <?xml version="1.0" encoding="UTF-8"?> <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"> <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US"><head><meta http-equiv="Content-Type" content="text/html; charset=utf-8"/><title>Internationalization Tag Set (ITS) Version 2.0 -- (Editors' copy)</title><style type="text/css" xml:space="preserve"> </style><link rel="stylesheet" href="local.css" type="text/css"/><link rel="stylesheet" type="text/css" href="base.css"/></head><body><div class="head"> <h1><a name="title" id="title" shape="rect"/>Internationalization Tag Set (ITS) Version 2.0</h1> <h2><a name="w3c-doctype" id="w3c-doctype"/>Editor's Copy</h2><p class="copyright"><a href="http://www.w3.org/Consortium/Legal/ipr-notice#Copyright" shape="rect">Copyright</a> © 2013 <a href="http://www.w3.org/" shape="rect"><acronym title="World Wide Web Consortium">W3C</acronym></a><sup>®</sup> (<a href="http://www.csail.mit.edu/" shape="rect"><acronym title="Massachusetts Institute of Technology">MIT</acronym></a>, <a href="http://www.ercim.eu/" shape="rect"><acronym title="European Research Consortium for Informatics and Mathematics">ERCIM</acronym></a>, <a href="http://www.keio.ac.jp/" shape="rect">Keio</a>, <a href="http://ev.buaa.edu.cn/" shape="rect">Beihang</a>), All Rights Reserved. W3C <a href="http://www.w3.org/Consortium/Legal/ipr-notice#Legal_Disclaimer" shape="rect">liability</a>, <a href="http://www.w3.org/Consortium/Legal/ipr-notice#W3C_Trademarks" shape="rect">trademark</a> and <a href="http://www.w3.org/Consortium/Legal/copyright-documents" shape="rect">document use</a> rules apply.</p>/div><hr/><div> <h2><a name="abstract" id="abstract" shape="rect"/>Abstract</h2><p>The technology described in this document - the <em>Internationalization Tag Set (ITS) 2.0</em> - enhances the foundation to integrate automated processing of human language into core Web technologies. ITS 2.0 bears many commonalities with is predecessor, <a href="http://www.w3.org/TR/2007/REC-its-20070403/" shape="rect">ITS 1.0</a> but provides additional concepts that are designed to foster the automated creation and processing of multilingual Web content. ITS 2.0 focuses on HTML, XML-based formats in general, and can leverage processing based on the XML Localization Interchange File Format (XLIFF), as well as the Natural Language Processing Interchange Format (NIF).</p></div><div> <h2><a name="status" shape="rect">Status of this Document</a></h2><p><strong>This document is an editors' copy that has no official standing.</strong> Last modified: <script type="text/javascript" xml:space="preserve"> document.write(document.lastModified);</script>.</p></div><div class="toc"> <h2><a name="contents" id="contents" shape="rect"/>Table of Contents</h2><div class="toc"><div class="toc1">1 <a href="#introduction" shape="rect">Introduction</a><div class="toc2">1.1 <a href="#overview" shape="rect">Overview</a></div> <div class="toc2">1.2 <a href="#general-motiviation-for-ITS2.0" shape="rect">General motivation for going beyond ITS 1.0</a></div> <div class="toc2">1.3 <a href="#usage-scenarios" shape="rect">Broader Usage Scenarios</a></div> <div class="toc2">1.4 <a href="#high-level-differences-between-1.0-and-2.0" shape="rect">High-level differences between ITS 1.0 and ITS 2.0</a><div class="toc3">1.4.1 <a href="#specific-HTML-support" shape="rect">Specific HTML support</a></div> <div class="toc3">1.4.2 <a href="#additional-data-categories" shape="rect">Additional data categories</a></div> <div class="toc3">1.4.3 <a href="#modified-datacategories" shape="rect">Modified data categories</a></div> <div class="toc3">1.4.4 <a href="#additional-mechanisms" shape="rect">Additional or modified mechanisms</a></div> <div class="toc3">1.4.5 <a href="#mappings" shape="rect">Mappings</a></div> <div class="toc3">1.4.6 <a href="#unicode-normalization" shape="rect">Unicode normalization</a></div> <div class="toc3">1.4.7 <a href="#extended-implementation-hints" shape="rect">Extended implementation hints</a></div> </div> </div> <div class="toc1">2 <a href="#basic-concepts" shape="rect">Basic Concepts</a><div class="toc2">2.1 <a href="#basic-concepts-selection" shape="rect">Selection</a><div class="toc3">2.1.1 <a href="#basic-concepts-selection-local" shape="rect">Local Approach</a></div> <div class="toc3">2.1.2 <a href="#basic-concepts-selection-global" shape="rect">Global Approach</a></div> </div> <div class="toc2">2.2 <a href="#basic-concepts-overinher" shape="rect">Overriding and Inheritance</a></div> <div class="toc2">2.3 <a href="#basic-concepts-addingpointing" shape="rect">Adding Information or Pointing to Existing Information</a></div> </div> <div class="toc1">3 <a href="#notation-terminology" shape="rect">Notation and Terminology</a><div class="toc2">3.1 <a href="#notation" shape="rect">Notation</a></div> <div class="toc2">3.2 <a href="#def-datacat" shape="rect">Data category</a></div> <div class="toc2">3.3 <a href="#def-selection" shape="rect">Selection</a></div> <div class="toc2">3.4 <a href="#def-local-attributes" shape="rect">ITS Local Attributes</a></div> <div class="toc2">3.5 <a href="#def-rule-elements" shape="rect">Rule Elements</a></div> <div class="toc2">3.6 <a href="#iri-usage" shape="rect">Usage of Internationalized Resource Identifiers in ITS</a></div> <div class="toc2">3.7 <a href="#def-html" shape="rect">The Term HTML</a></div> <div class="toc2">3.8 <a href="#def-css-selector" shape="rect">The Term CSS Selectors</a></div> </div> <div class="toc1">4 <a href="#conformance" shape="rect">Conformance</a><div class="toc2">4.1 <a href="#conformance-product-schema" shape="rect">Conformance Type 1: ITS Markup Declarations</a></div> <div class="toc2">4.2 <a href="#conformance-product-processing-expectations" shape="rect">Conformance Type 2: The Processing Expectations for ITS Markup</a></div> <div class="toc2">4.3 <a href="#conformance-product-html-processing-expectations" shape="rect">Conformance Type 3: Processing Expectations for ITS Markup in HTML</a></div> <div class="toc2">4.4 <a href="#conformance-class-html5-its" shape="rect">Conformance Class for HTML5+ITS documents</a></div> </div> <div class="toc1">5 <a href="#its-processing" shape="rect">Processing of ITS information</a><div class="toc2">5.1 <a href="#its-version-attribute" shape="rect">Indicating the Version of ITS</a></div> <div class="toc2">5.2 <a href="#datacategory-locations" shape="rect">Locations of Data Categories</a><div class="toc3">5.2.1 <a href="#selection-global" shape="rect">Global, Rule-based Selection</a></div> <div class="toc3">5.2.2 <a href="#selection-local" shape="rect">Local Selection in an XML Document</a></div> </div> <div class="toc2">5.3 <a href="#selectors" shape="rect">Query Language of Selectors</a><div class="toc3">5.3.1 <a href="#queryLanguage" shape="rect">Choosing Query Language</a></div> <div class="toc3">5.3.2 <a href="#d0e1913" shape="rect">XPath 1.0</a></div> <div class="toc3">5.3.3 <a href="#css-selectors" shape="rect">CSS Selectors</a></div> <div class="toc3">5.3.4 <a href="#d0e2158" shape="rect">Additional query languages</a></div> <div class="toc3">5.3.5 <a href="#its-param" shape="rect">Variables in selectors</a></div> </div> <div class="toc2">5.4 <a href="#link-external-rules" shape="rect">Link to External Rules</a></div> <div class="toc2">5.5 <a href="#selection-precedence" shape="rect">Precedence between Selections</a></div> <div class="toc2">5.6 <a href="#associating-its-with-existing-markup" shape="rect">Associating ITS Data Categories with Existing Markup</a></div> <div class="toc2">5.7 <a href="#conversion-to-nif" shape="rect">Conversion to NIF</a></div> <div class="toc2">5.8 <a href="#its-tool-annotation" shape="rect">ITS Tools Annotation</a></div> </div> <div class="toc1">6 <a href="#html5-markup" shape="rect">Using ITS Markup in HTML</a><div class="toc2">6.1 <a href="#html5-local-attributes" shape="rect">Mapping of Local Data Categories to HTML</a></div> <div class="toc2">6.2 <a href="#html5-global-rules" shape="rect">Global rules</a></div> <div class="toc2">6.3 <a href="#html5-standoff-markup" shape="rect">Standoff Markup in HTML</a></div> <div class="toc2">6.4 <a href="#html5-selection-precedence" shape="rect">Precedence between Selections</a></div> </div> <div class="toc1">7 <a href="#xhtml5-markup" shape="rect">Using ITS Markup in XHTML</a></div> <div class="toc1">8 <a href="#datacategory-description" shape="rect">Description of Data Categories</a><div class="toc2">8.1 <a href="#datacategories-defaults-etc" shape="rect">Position, Defaults, Inheritance and Overriding of Data Categories</a></div> <div class="toc2">8.2 <a href="#trans-datacat" shape="rect">Translate</a><div class="toc3">8.2.1 <a href="#translatability-definition" shape="rect">Definition</a></div> <div class="toc3">8.2.2 <a href="#translatability-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.3 <a href="#locNote-datacat" shape="rect">Localization Note</a><div class="toc3">8.3.1 <a href="#locNote-definition" shape="rect">Definition</a></div> <div class="toc3">8.3.2 <a href="#locNote-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.4 <a href="#terminology" shape="rect">Terminology</a><div class="toc3">8.4.1 <a href="#terminology-definition" shape="rect">Definition</a></div> <div class="toc3">8.4.2 <a href="#terminology-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.5 <a href="#directionality" shape="rect">Directionality</a><div class="toc3">8.5.1 <a href="#directionality-definition" shape="rect">Definition</a></div> <div class="toc3">8.5.2 <a href="#directionality-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.6 <a href="#language-information" shape="rect">Language Information</a><div class="toc3">8.6.1 <a href="#langinfo-definition" shape="rect">Definition</a></div> <div class="toc3">8.6.2 <a href="#langinfo-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.7 <a href="#elements-within-text" shape="rect">Elements Within Text</a><div class="toc3">8.7.1 <a href="#within-text-definition" shape="rect">Definition</a></div> <div class="toc3">8.7.2 <a href="#within-text-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.8 <a href="#domain" shape="rect">Domain</a><div class="toc3">8.8.1 <a href="#domain-definition" shape="rect">Definition</a></div> <div class="toc3">8.8.2 <a href="#domain-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.9 <a href="#textanalysis" shape="rect">Text Analysis</a><div class="toc3">8.9.1 <a href="#textanalysis-definition" shape="rect">Definition</a></div> <div class="toc3">8.9.2 <a href="#textanalysis-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.10 <a href="#LocaleFilter" shape="rect">Locale Filter</a><div class="toc3">8.10.1 <a href="#LocaleFilter-definition" shape="rect">Definition</a></div> <div class="toc3">8.10.2 <a href="#LocaleFilter-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.11 <a href="#provenance" shape="rect">Provenance</a><div class="toc3">8.11.1 <a href="#provenance-definition" shape="rect">Definition</a></div> <div class="toc3">8.11.2 <a href="#provenance-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.12 <a href="#externalresource" shape="rect">External Resource</a><div class="toc3">8.12.1 <a href="#externalresource-definition" shape="rect">Definition</a></div> <div class="toc3">8.12.2 <a href="#externalresource-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.13 <a href="#target-pointer" shape="rect">Target Pointer</a><div class="toc3">8.13.1 <a href="#target-pointer-definition" shape="rect">Definition</a></div> <div class="toc3">8.13.2 <a href="#target-pointer-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.14 <a href="#idvalue" shape="rect">Id Value</a><div class="toc3">8.14.1 <a href="#idvalue-definition" shape="rect">Definition</a></div> <div class="toc3">8.14.2 <a href="#idvalue-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.15 <a href="#preservespace" shape="rect">Preserve Space</a><div class="toc3">8.15.1 <a href="#preservespace-definition" shape="rect">Definition</a></div> <div class="toc3">8.15.2 <a href="#preservespace-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.16 <a href="#lqissue" shape="rect">Localization Quality Issue</a><div class="toc3">8.16.1 <a href="#lqissue-definition" shape="rect">Definition</a></div> <div class="toc3">8.16.2 <a href="#lqissue-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.17 <a href="#lqrating" shape="rect">Localization Quality Rating</a><div class="toc3">8.17.1 <a href="#lqrating-definition" shape="rect">Definition</a></div> <div class="toc3">8.17.2 <a href="#lqrating-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.18 <a href="#mtconfidence" shape="rect">MT Confidence</a><div class="toc3">8.18.1 <a href="#mtconfidence-definition" shape="rect">Definition</a></div> <div class="toc3">8.18.2 <a href="#mtconfidence-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.19 <a href="#allowedchars" shape="rect">Allowed Characters</a><div class="toc3">8.19.1 <a href="#allowedchars-definition" shape="rect">Definition</a></div> <div class="toc3">8.19.2 <a href="#allowedchars-implementation" shape="rect">Implementation</a></div> </div> <div class="toc2">8.20 <a href="#storagesize" shape="rect">Storage Size</a><div class="toc3">8.20.1 <a href="#storagesize-definition" shape="rect">Definition</a></div> <div class="toc3">8.20.2 <a href="#storagesize-implementation" shape="rect">Implementation</a></div> </div> </div> </div> <h3><a name="appendices" id="appendices" shape="rect"/>Appendices</h3><div class="toc1">A <a href="#normative-references" shape="rect">References</a></div> <div class="toc1">B <a href="#its-mime-type" shape="rect">Internationalization Tag Set (ITS) MIME Type</a></div> <div class="toc1">C <a href="#lqissue-typevalues" shape="rect">Values for the Localization Quality Issue Type</a></div> <div class="toc1">D <a href="#its-schemas" shape="rect">Schemas for ITS</a></div> <div class="toc1">E <a href="#informative-references" shape="rect">References</a> (Non-Normative)</div> <div class="toc1">F <a href="#nif-backconversion" shape="rect">Conversion NIF2ITS</a> (Non-Normative)</div> <div class="toc1">G <a href="#list-of-elements-and-attributes" shape="rect">List of ITS 2.0 Global Elements and Local Attributes</a> (Non-Normative)</div> <div class="toc1">H <a href="#revisionlog" shape="rect">Revision Log</a> (Non-Normative)</div> <div class="toc1">I <a href="#acknowledgements" shape="rect">Acknowledgements</a> (Non-Normative)</div> </div><hr/><div class="body"><div class="div1"> <h2><a href="#contents" shape="rect"><img src="images/topOfPage.gif" align="right" height="26" width="26" title="Go to the table of contents." alt="Go to the table of contents."/></a><a name="introduction" id="introduction" shape="rect"/>1 Introduction</h2><div class="div2"> <h3><a href="#contents" shape="rect"><img src="images/topOfPage.gif" align="right" height="26" width="26" title="Go to the table of contents." alt="Go to the table of contents."/></a><a name="overview" id="overview" shape="rect"/>1.1 Overview</h3><p> Content or software that is authored in one language (so-called original language) for one locale (e.g. the French-speaking part of Canada) is often made available in additional languages or adapted with regard to other cultural aspects. A prevailing paradigm for the corresponding approach to production in many cases encompasses [5997 lines skipped]
Received on Thursday, 30 May 2013 07:53:32 UTC