Rollup merge of #44086 - kennytm:htmldocck-python3, r=Mark-Simulacrum

Allow `htmldocck.py` to run using Python 3
author: Corey Farwell <coreyf@rwell.org> 2017-08-26 06:46:35 -0700
committer: GitHub <noreply@github.com> 2017-08-26 06:46:35 -0700
commit: cc5c1e39f475d6b91b85191d4ad3cd32d110cbed (patch)
tree: d0e5b2ef897731c5f753b55b1e369945f055cfa5
parent: 7e8753d1c12b5eec03280c876bafd3423833c5b6 (diff)
parent: 6a721317ff0621a97690dc573ced88274d860e84 (diff)
download: rust-cc5c1e39f475d6b91b85191d4ad3cd32d110cbed.tar.gz
rust-cc5c1e39f475d6b91b85191d4ad3cd32d110cbed.zip
1 files changed, 20 insertions, 13 deletions
diff --git a/src/etc/htmldocck.py b/src/etc/htmldocck.py
index a5449b748dd..7e8fde20346 100644
--- a/src/etc/htmldocck.py
+++ b/src/etc/htmldocck.py
@@ -29,7 +29,7 @@ showing the expected renderings.
 
 In order to avoid one-off dependencies for this task, this script uses
 a reasonably working HTML parser and the existing XPath implementation
-from Python 2's standard library. Hopefully we won't render
+from Python's standard library. Hopefully we won't render
 non-well-formed HTML.
 
 # Commands
@@ -110,11 +110,17 @@ import os.path
 import re
 import shlex
 from collections import namedtuple
-from HTMLParser import HTMLParser
+try:
+    from html.parser import HTMLParser
+except ImportError:
+    from HTMLParser import HTMLParser
 from xml.etree import cElementTree as ET
 
 # &larrb;/&rarrb; are not in HTML 4 but are in HTML 5
-from htmlentitydefs import entitydefs
+try:
+    from html.entities import entitydefs
+except ImportError:
+    from htmlentitydefs import entitydefs
 entitydefs['larrb'] = u'\u21e4'
 entitydefs['rarrb'] = u'\u21e5'
 entitydefs['nbsp'] = ' '
@@ -123,6 +129,11 @@ entitydefs['nbsp'] = ' '
 VOID_ELEMENTS = set(['area', 'base', 'br', 'col', 'embed', 'hr', 'img', 'input', 'keygen',
                      'link', 'menuitem', 'meta', 'param', 'source', 'track', 'wbr'])
 
+# Python 2 -> 3 compatibility
+try:
+    unichr
+except NameError:
+    unichr = chr
 
 class CustomHTMLParser(HTMLParser):
     """simplified HTML parser.
@@ -184,12 +195,8 @@ def concat_multi_lines(f):
 
         # strip the common prefix from the current line if needed
         if lastline is not None:
-            maxprefix = 0
-            for i in xrange(min(len(line), len(lastline))):
-                if line[i] != lastline[i]:
-                    break
-                maxprefix += 1
-            line = line[maxprefix:].lstrip()
+            common_prefix = os.path.commonprefix([line, lastline])
+            line = line[len(common_prefix):].lstrip()
 
         firstlineno = firstlineno or lineno
         if line.endswith('\\'):
@@ -213,7 +220,7 @@ LINE_PATTERN = re.compile(r'''
 
 
 def get_commands(template):
-    with open(template, 'rUb') as f:
+    with open(template, 'rU') as f:
         for lineno, line in concat_multi_lines(f):
             m = LINE_PATTERN.search(line)
             if not m:
@@ -372,7 +379,7 @@ def check_command(c, cache):
                     cache.get_file(c.args[0])
                     ret = True
                 except FailedCheck as err:
-                    cerr = err.message
+                    cerr = str(err)
                     ret = False
             elif len(c.args) == 2: # @has/matches <path> <pat> = string test
                 cerr = "`PATTERN` did not match"
@@ -413,9 +420,9 @@ def check_command(c, cache):
 
     except FailedCheck as err:
         message = '@{}{} check failed'.format('!' if c.negated else '', c.cmd)
-        print_err(c.lineno, c.context, err.message, message)
+        print_err(c.lineno, c.context, str(err), message)
     except InvalidCheck as err:
-        print_err(c.lineno, c.context, err.message)
+        print_err(c.lineno, c.context, str(err))
 
 def check(target, commands):
     cache = CachedFiles(target)
author	Corey Farwell <coreyf@rwell.org>	2017-08-26 06:46:35 -0700
committer	GitHub <noreply@github.com>	2017-08-26 06:46:35 -0700
commit	cc5c1e39f475d6b91b85191d4ad3cd32d110cbed (patch)
tree	d0e5b2ef897731c5f753b55b1e369945f055cfa5
parent	7e8753d1c12b5eec03280c876bafd3423833c5b6 (diff)
parent	6a721317ff0621a97690dc573ced88274d860e84 (diff)
download	rust-cc5c1e39f475d6b91b85191d4ad3cd32d110cbed.tar.gz rust-cc5c1e39f475d6b91b85191d4ad3cd32d110cbed.zip