diff options
author | Victor Stinner <victor.stinner@haypocalc.com> | 2011-05-19 13:18:36 (GMT) |
---|---|---|
committer | Victor Stinner <victor.stinner@haypocalc.com> | 2011-05-19 13:18:36 (GMT) |
commit | cfd365b937a1edaf9da1ac61c2ca6be06fc42744 (patch) | |
tree | ef91befec6370086cffe2ea6c27b4bcee9cca138 /Lib/packaging/command/build_scripts.py | |
parent | 35de5ac44db5c42c792b71077520a6b3ef29b199 (diff) | |
download | cpython-cfd365b937a1edaf9da1ac61c2ca6be06fc42744.zip cpython-cfd365b937a1edaf9da1ac61c2ca6be06fc42744.tar.gz cpython-cfd365b937a1edaf9da1ac61c2ca6be06fc42744.tar.bz2 |
Issue #10419, issue #6011: port 6ad356525381 fix from distutils to packaging
The build_scripts command of packaging now correctly handles a non-ASCII path
to the Python executable. Open and write the script in binary mode, but ensure
that the shebang is decodable from UTF-8 and from the encoding of the script.
Diffstat (limited to 'Lib/packaging/command/build_scripts.py')
-rw-r--r-- | Lib/packaging/command/build_scripts.py | 48 |
1 file changed, 35 insertions, 13 deletions
diff --git a/Lib/packaging/command/build_scripts.py b/Lib/packaging/command/build_scripts.py index 7fba0e5..fe14e0a 100644 --- a/Lib/packaging/command/build_scripts.py +++ b/Lib/packaging/command/build_scripts.py @@ -3,6 +3,7 @@ import os import re import sysconfig +import tokenize from packaging.command.cmd import Command from packaging.util import convert_path, newer @@ -11,7 +12,7 @@ from packaging.compat import Mixin2to3 # check if Python is called on the first line with this expression -first_line_re = re.compile('^#!.*python[0-9.]*([ \t].*)?$') +first_line_re = re.compile(b'^#!.*python[0-9.]*([ \t].*)?$') class build_scripts(Command, Mixin2to3): @@ -76,12 +77,14 @@ class build_scripts(Command, Mixin2to3): # that way, we'll get accurate feedback if we can read the # script. try: - f = open(script, "r") + f = open(script, "rb") except IOError: if not self.dry_run: raise f = None else: + encoding, lines = tokenize.detect_encoding(f.readline) + f.seek(0) first_line = f.readline() if not first_line: logger.warning('%s: %s is an empty file (skipping)', @@ -91,26 +94,45 @@ class build_scripts(Command, Mixin2to3): match = first_line_re.match(first_line) if match: adjust = True - post_interp = match.group(1) or '' + post_interp = match.group(1) or b'' if adjust: logger.info("copying and adjusting %s -> %s", script, self.build_dir) if not self.dry_run: - outf = open(outfile, "w") if not sysconfig.is_python_build(): - outf.write("#!%s%s\n" % - (self.executable, - post_interp)) + executable = self.executable else: - outf.write("#!%s%s\n" % - (os.path.join( + executable = os.path.join( sysconfig.get_config_var("BINDIR"), "python%s%s" % (sysconfig.get_config_var("VERSION"), - sysconfig.get_config_var("EXE"))), - post_interp)) - outf.writelines(f.readlines()) - outf.close() + sysconfig.get_config_var("EXE"))) + executable = os.fsencode(executable) + shebang = b"#!" 
+ executable + post_interp + b"\n" + # Python parser starts to read a script using UTF-8 until + # it gets a #coding:xxx cookie. The shebang has to be the + # first line of a file, the #coding:xxx cookie cannot be + # written before. So the shebang has to be decodable from + # UTF-8. + try: + shebang.decode('utf-8') + except UnicodeDecodeError: + raise ValueError( + "The shebang ({!r}) is not decodable " + "from utf-8".format(shebang)) + # If the script is encoded to a custom encoding (use a + # #coding:xxx cookie), the shebang has to be decodable from + # the script encoding too. + try: + shebang.decode(encoding) + except UnicodeDecodeError: + raise ValueError( + "The shebang ({!r}) is not decodable " + "from the script encoding ({})" + .format(shebang, encoding)) + with open(outfile, "wb") as outf: + outf.write(shebang) + outf.writelines(f.readlines()) if f: f.close() else: |