diff options
author | Greg Ward <gward@python.net> | 2000-02-17 23:56:15 (GMT) |
---|---|---|
committer | Greg Ward <gward@python.net> | 2000-02-17 23:56:15 (GMT) |
commit | a82122b8875a8bef0422dc236a6c4a9dadc5e417 (patch) | |
tree | aa7550d0a892d657314718e0a0b30e45219d560d /Lib/distutils/command | |
parent | 3d6b023f5cf7801a6db44cd943f810fa595730fe (diff) | |
download | cpython-a82122b8875a8bef0422dc236a6c4a9dadc5e417.zip cpython-a82122b8875a8bef0422dc236a6c4a9dadc5e417.tar.gz cpython-a82122b8875a8bef0422dc236a6c4a9dadc5e417.tar.bz2 |
The 'sdist' command to create a source distribution. This is derived from the
old 'dist' command, but the code for dealing with manifests is completely
redone -- and renaming the command to 'sdist' is more symmetric with the
soon-to-exist 'bdist' command.
Diffstat (limited to 'Lib/distutils/command')
-rw-r--r-- | Lib/distutils/command/sdist.py | 716 |
1 files changed, 716 insertions, 0 deletions
diff --git a/Lib/distutils/command/sdist.py b/Lib/distutils/command/sdist.py new file mode 100644 index 0000000..c8101a7 --- /dev/null +++ b/Lib/distutils/command/sdist.py @@ -0,0 +1,716 @@ +"""distutils.command.sdist + +Implements the Distutils 'sdist' command (create a source distribution).""" + +# created 1999/09/22, Greg Ward + +__rcsid__ = "$Id$" + +import sys, os, string, re +import fnmatch +from types import * +from glob import glob +from shutil import rmtree +from distutils.core import Command +from distutils.util import newer +from distutils.text_file import TextFile +from distutils.errors import DistutilsExecError + + +class Sdist (Command): + + description = "create a source distribution (tarball, zip file, etc.)" + + options = [('template=', 't', + "name of manifest template file [default: MANIFEST.in]"), + ('manifest=', 'm', + "name of manifest file [default: MANIFEST]"), + ('use-defaults', None, + "include the default file set in the manifest " + "[default; disable with --no-defaults]"), + ('manifest-only', None, + "just regenerate the manifest and then stop"), + ('force-manifest', None, + "forcibly regenerate the manifest and carry on as usual"), + + ('formats=', None, + "formats for source distribution (tar, ztar, gztar, or zip)"), + ('list-only', 'l', + "just list files that would be distributed"), + ('keep-tree', 'k', + "keep the distribution tree around after creating " + + "archive file(s)"), + ] + negative_opts = {'use-defaults': 'no-defaults'} + + default_format = { 'posix': 'gztar', + 'nt': 'zip' } + + exclude_re = re.compile (r'\s*!\s*(\S+)') # for manifest lines + + + def set_default_options (self): + # 'template' and 'manifest' are, respectively, the names of + # the manifest template and manifest file. + self.template = None + self.manifest = None + + # 'use_defaults': if true, we will include the default file set + # in the manifest + self.use_defaults = 1 + + self.manifest_only = 0 + self.force_manifest = 0 + + self.formats = None + self.list_only = 0 + self.keep_tree = 0 + + + def set_final_options (self): + if self.manifest is None: + self.manifest = "MANIFEST" + if self.template is None: + self.template = "MANIFEST.in" + + if self.formats is None: + try: + self.formats = [self.default_format[os.name]] + except KeyError: + raise DistutilsPlatformError, \ + "don't know how to build source distributions on " + \ + "%s platform" % os.name + elif type (self.formats) is StringType: + self.formats = string.split (self.formats, ',') + + + def run (self): + + # 'files' is the list of files that will make up the manifest + self.files = [] + + # Ensure that all required meta-data is given; warn if not (but + # don't die, it's not *that* serious!) + self.check_metadata () + + # Do whatever it takes to get the list of files to process + # (process the manifest template, read an existing manifest, + # whatever). File list is put into 'self.files'. + self.get_file_list () + + # If user just wanted us to regenerate the manifest, stop now. + if self.manifest_only: + return + + # Otherwise, go ahead and create the source distribution tarball, + # or zipfile, or whatever. + self.make_distribution () + + + def check_metadata (self): + + dist = self.distribution + + missing = [] + for attr in ('name', 'version', 'url'): + if not (hasattr (dist, attr) and getattr (dist, attr)): + missing.append (attr) + + if missing: + self.warn ("missing required meta-data: " + + string.join (missing, ", ")) + + if dist.author: + if not dist.author_email: + self.warn ("missing meta-data: if 'author' supplied, " + + "'author_email' must be supplied too") + elif dist.maintainer: + if not dist.maintainer_email: + self.warn ("missing meta-data: if 'maintainer' supplied, " + + "'maintainer_email' must be supplied too") + else: + self.warn ("missing meta-data: either (author and author_email) " + + "or (maintainer and maintainer_email) " + + "must be supplied") + + # check_metadata () + + + def get_file_list (self): + """Figure out the list of files to include in the source + distribution, and put it in 'self.files'. This might + involve reading the manifest template (and writing the + manifest), or just reading the manifest, or just using + the default file set -- it all depends on the user's + options and the state of the filesystem.""" + + + template_exists = os.path.isfile (self.template) + if template_exists: + template_newer = newer (self.template, self.manifest) + + # Regenerate the manifest if necessary (or if explicitly told to) + if ((template_exists and template_newer) or + self.force_manifest or + self.manifest_only): + + if not template_exists: + self.warn (("manifest template '%s' does not exist " + + "(using default file list)") % + self.template) + + # Add default file set to 'files' + if self.use_defaults: + self.find_defaults () + + # Read manifest template if it exists + if template_exists: + self.read_template () + + # File list now complete -- sort it so that higher-level files + # come first + sortable_files = map (os.path.split, self.files) + sortable_files.sort () + self.files = [] + for sort_tuple in sortable_files: + self.files.append (apply (os.path.join, sort_tuple)) + + # Remove duplicates from the file list + for i in range (len(self.files)-1, 0, -1): + if self.files[i] == self.files[i-1]: + del self.files[i] + + # And write complete file list (including default file set) to + # the manifest. + self.write_manifest () + + # Don't regenerate the manifest, just read it in. + else: + self.read_manifest () + + # get_file_list () + + + def find_defaults (self): + + standards = [('README', 'README.txt'), 'setup.py'] + for fn in standards: + if type (fn) is TupleType: + alts = fn + for fn in alts: + if os.path.exists (fn): + got_it = 1 + self.files.append (fn) + break + + if not got_it: + self.warn ("standard file not found: should have one of " + + string.join (alts, ', ')) + else: + if os.path.exists (fn): + self.files.append (fn) + else: + self.warn ("standard file '%s' not found" % fn) + + optional = ['test/test*.py'] + for pattern in optional: + files = filter (os.path.isfile, glob (pattern)) + if files: + self.files.extend (files) + + if self.distribution.packages or self.distribution.py_modules: + build_py = self.find_peer ('build_py') + build_py.ensure_ready () + self.files.extend (build_py.get_source_files ()) + + if self.distribution.ext_modules: + build_ext = self.find_peer ('build_ext') + build_ext.ensure_ready () + self.files.extend (build_ext.get_source_files ()) + + + + def search_dir (self, dir, pattern=None): + """Recursively find files under 'dir' matching 'pattern' (a string + containing a Unix-style glob pattern). If 'pattern' is None, + find all files under 'dir'. Return the list of found + filenames.""" + + allfiles = findall (dir) + if pattern is None: + return allfiles + + pattern_re = translate_pattern (pattern) + files = [] + for file in allfiles: + if pattern_re.match (os.path.basename (file)): + files.append (file) + + return files + + # search_dir () + + + def exclude_pattern (self, pattern): + """Remove filenames from 'self.files' that match 'pattern'.""" + print "exclude_pattern: pattern=%s" % pattern + pattern_re = translate_pattern (pattern) + for i in range (len (self.files)-1, -1, -1): + if pattern_re.match (self.files[i]): + print "removing %s" % self.files[i] + del self.files[i] + + + def recursive_exclude_pattern (self, dir, pattern=None): + """Remove filenames from 'self.files' that are under 'dir' + and whose basenames match 'pattern'.""" + + print "recursive_exclude_pattern: dir=%s, pattern=%s" % (dir, pattern) + if pattern is None: + pattern_re = None + else: + pattern_re = translate_pattern (pattern) + + for i in range (len (self.files)-1, -1, -1): + (cur_dir, cur_base) = os.path.split (self.files[i]) + if (cur_dir == dir and + (pattern_re is None or pattern_re.match (cur_base))): + print "removing %s" % self.files[i] + del self.files[i] + + + def read_template (self): + """Read and parse the manifest template file named by + 'self.template' (usually "MANIFEST.in"). Process all file + specifications (include and exclude) in the manifest template + and add the resulting filenames to 'self.files'.""" + + assert self.files is not None and type (self.files) is ListType + + template = TextFile (self.template, + strip_comments=1, + skip_blanks=1, + join_lines=1, + lstrip_ws=1, + rstrip_ws=1, + collapse_ws=1) + + all_files = findall () + + while 1: + + line = template.readline() + if line is None: # end of file + break + + words = string.split (line) + action = words[0] + + # First, check that the right number of words are present + # for the given action (which is the first word) + if action in ('include','exclude', + 'global-include','global-exclude'): + if len (words) != 2: + template.warn \ + ("invalid manifest template line: " + + "'%s' expects a single <pattern>" % + action) + continue + + pattern = words[1] + + elif action in ('recursive-include','recursive-exclude'): + if len (words) != 3: + template.warn \ + ("invalid manifest template line: " + + "'%s' expects <dir> <pattern>" % + action) + continue + + (dir, pattern) = words[1:3] + + elif action in ('graft','prune'): + if len (words) != 2: + template.warn \ + ("invalid manifest template line: " + + "'%s' expects a single <dir_pattern>" % + action) + continue + + dir_pattern = words[1] + + else: + template.warn ("invalid manifest template line: " + + "unknown action '%s'" % action) + continue + + # OK, now we know that the action is valid and we have the + # right number of words on the line for that action -- so we + # can proceed with minimal error-checking. Also, we have + # defined either 'patter', 'dir' and 'pattern', or + # 'dir_pattern' -- so we don't have to spend any time digging + # stuff up out of 'words'. + + if action == 'include': + print "include", pattern + files = select_pattern (all_files, pattern, anchor=1) + if not files: + template.warn ("no files found matching '%s'" % pattern) + else: + self.files.extend (files) + + elif action == 'exclude': + print "exclude", pattern + num = exclude_pattern (self.files, pattern, anchor=1) + if num == 0: + template.warn \ + ("no previously-included files found matching '%s'" % + pattern) + + elif action == 'global-include': + print "global-include", pattern + files = select_pattern (all_files, pattern, anchor=0) + if not files: + template.warn (("no files found matching '%s' " + + "anywhere in distribution") % + pattern) + else: + self.files.extend (files) + + elif action == 'global-exclude': + print "global-exclude", pattern + num = exclude_pattern (self.files, pattern, anchor=0) + if num == 0: + template.warn \ + (("no previously-included files matching '%s' " + + "found anywhere in distribution") % + pattern) + + elif action == 'recursive-include': + print "recursive-include", dir, pattern + files = select_pattern (all_files, pattern, prefix=dir) + if not files: + template.warn (("no files found matching '%s' " + + "under directory '%s'") % + (pattern, dir)) + else: + self.files.extend (files) + + elif action == 'recursive-exclude': + print "recursive-exclude", dir, pattern + num = exclude_pattern (self.files, pattern, prefix=dir) + if num == 0: + template.warn \ + (("no previously-included files matching '%s' " + + "found under directory '%s'") % + (pattern, dir)) + + elif action == 'graft': + print "graft", dir_pattern + files = select_pattern (all_files, None, prefix=dir_pattern) + if not files: + template.warn ("no directories found matching '%s'" % + dir_pattern) + else: + self.files.extend (files) + + elif action == 'prune': + print "prune", dir_pattern + num = exclude_pattern (self.files, None, prefix=dir_pattern) + if num == 0: + template.warn \ + (("no previously-included directories found " + + "matching '%s'") % + dir_pattern) + else: + raise RuntimeError, \ + "this cannot happen: invalid action '%s'" % action + + # while loop over lines of template file + + # read_template () + + + def write_manifest (self): + """Write the file list in 'self.files' (presumably as filled in + by 'find_defaults()' and 'read_template()') to the manifest file + named by 'self.manifest'.""" + + manifest = open (self.manifest, "w") + for fn in self.files: + manifest.write (fn + '\n') + manifest.close () + + # write_manifest () + + + def read_manifest (self): + """Read the manifest file (named by 'self.manifest') and use + it to fill in 'self.files', the list of files to include + in the source distribution.""" + + manifest = open (self.manifest) + while 1: + line = manifest.readline () + if line == '': # end of file + break + if line[-1] == '\n': + line = line[0:-1] + self.files.append (line) + + # read_manifest () + + + + def make_release_tree (self, base_dir, files): + + # First get the list of directories to create + need_dir = {} + for file in files: + need_dir[os.path.join (base_dir, os.path.dirname (file))] = 1 + need_dirs = need_dir.keys() + need_dirs.sort() + + # Now create them + for dir in need_dirs: + self.mkpath (dir) + + # And walk over the list of files, either making a hard link (if + # os.link exists) to each one that doesn't already exist in its + # corresponding location under 'base_dir', or copying each file + # that's out-of-date in 'base_dir'. (Usually, all files will be + # out-of-date, because by default we blow away 'base_dir' when + # we're done making the distribution archives.) + + try: + link = os.link + msg = "making hard links in %s..." % base_dir + except AttributeError: + link = 0 + msg = "copying files to %s..." % base_dir + + self.announce (msg) + for file in files: + dest = os.path.join (base_dir, file) + if link: + if not os.path.exists (dest): + self.execute (os.link, (file, dest), + "linking %s -> %s" % (file, dest)) + else: + self.copy_file (file, dest) + + # make_release_tree () + + + def nuke_release_tree (self, base_dir): + try: + self.execute (rmtree, (base_dir,), + "removing %s" % base_dir) + except (IOError, OSError), exc: + if exc.filename: + msg = "error removing %s: %s (%s)" % \ + (base_dir, exc.strerror, exc.filename) + else: + msg = "error removing %s: %s" % (base_dir, exc.strerror) + self.warn (msg) + + + def make_tarball (self, base_dir, compress="gzip"): + + # XXX GNU tar 1.13 has a nifty option to add a prefix directory. + # It's pretty new, though, so we certainly can't require it -- + # but it would be nice to take advantage of it to skip the + # "create a tree of hardlinks" step! (Would also be nice to + # detect GNU tar to use its 'z' option and save a step.) + + if compress is not None and compress not in ('gzip', 'compress'): + raise ValueError, \ + "if given, 'compress' must be 'gzip' or 'compress'" + + archive_name = base_dir + ".tar" + self.spawn (["tar", "-cf", archive_name, base_dir]) + + if compress: + self.spawn ([compress, archive_name]) + + + def make_zipfile (self, base_dir): + + # This initially assumed the Unix 'zip' utility -- but + # apparently InfoZIP's zip.exe works the same under Windows, so + # no changes needed! + + try: + self.spawn (["zip", "-r", base_dir + ".zip", base_dir]) + except DistutilsExecError: + + # XXX really should distinguish between "couldn't find + # external 'zip' command" and "zip failed" -- shouldn't try + # again in the latter case. (I think fixing this will + # require some cooperation from the spawn module -- perhaps + # a utility function to search the path, so we can fallback + # on zipfile.py without the failed spawn.) + try: + import zipfile + except ImportError: + raise DistutilsExecError, \ + ("unable to create zip file '%s.zip': " + + "could neither find a standalone zip utility nor " + + "import the 'zipfile' module") % base_dir + + z = zipfile.ZipFile (base_dir + ".zip", "wb", + compression=zipfile.ZIP_DEFLATED) + + def visit (z, dirname, names): + for name in names: + path = os.path.join (dirname, name) + if os.path.isfile (path): + z.write (path, path) + + os.path.walk (base_dir, visit, z) + z.close() + + + def make_distribution (self): + + # Don't warn about missing meta-data here -- should be done + # elsewhere. + name = self.distribution.name or "UNKNOWN" + version = self.distribution.version + + if version: + base_dir = "%s-%s" % (name, version) + else: + base_dir = name + + # Remove any files that match "base_dir" from the fileset -- we + # don't want to go distributing the distribution inside itself! + self.exclude_pattern (base_dir + "*") + + self.make_release_tree (base_dir, self.files) + for fmt in self.formats: + if fmt == 'gztar': + self.make_tarball (base_dir, compress='gzip') + elif fmt == 'ztar': + self.make_tarball (base_dir, compress='compress') + elif fmt == 'tar': + self.make_tarball (base_dir, compress=None) + elif fmt == 'zip': + self.make_zipfile (base_dir) + + if not self.keep_tree: + self.nuke_release_tree (base_dir) + +# class Dist + + +# ---------------------------------------------------------------------- +# Utility functions + +def findall (dir = os.curdir): + """Find all files under 'dir' and return the list of full + filenames (relative to 'dir').""" + + list = [] + stack = [dir] + pop = stack.pop + push = stack.append + + while stack: + dir = pop() + names = os.listdir (dir) + + for name in names: + if dir != os.curdir: # avoid the dreaded "./" syndrome + fullname = os.path.join (dir, name) + else: + fullname = name + list.append (fullname) + if os.path.isdir (fullname) and not os.path.islink(fullname): + push (fullname) + + return list + + +def select_pattern (files, pattern, anchor=1, prefix=None): + """Select strings (presumably filenames) from 'files' that match + 'pattern', a Unix-style wildcard (glob) pattern. Patterns are not + quite the same as implemented by the 'fnmatch' module: '*' and '?' + match non-special characters, where "special" is platform-dependent: + slash on Unix, colon, slash, and backslash on DOS/Windows, and colon + on Mac OS. + + If 'anchor' is true (the default), then the pattern match is more + stringent: "*.py" will match "foo.py" but not "foo/bar.py". If + 'anchor' is false, both of these will match. + + If 'prefix' is supplied, then only filenames starting with 'prefix' + (itself a pattern) and ending with 'pattern', with anything in + between them, will match. 'anchor' is ignored in this case. + + Return the list of matching strings, possibly empty.""" + + matches = [] + pattern_re = translate_pattern (pattern, anchor, prefix) + print "select_pattern: applying re %s" % pattern_re.pattern + for name in files: + if pattern_re.search (name): + matches.append (name) + print " adding", name + + return matches + +# select_pattern () + + +def exclude_pattern (files, pattern, anchor=1, prefix=None): + + pattern_re = translate_pattern (pattern, anchor, prefix) + print "exclude_pattern: applying re %s" % pattern_re.pattern + for i in range (len(files)-1, -1, -1): + if pattern_re.search (files[i]): + print " removing", files[i] + del files[i] + +# exclude_pattern () + + +def glob_to_re (pattern): + """Translate a shell-like glob pattern to a regular expression; + return a string containing the regex. Differs from + 'fnmatch.translate()' in that '*' does not match "special + characters" (which are platform-specific).""" + pattern_re = fnmatch.translate (pattern) + + # '?' and '*' in the glob pattern become '.' and '.*' in the RE, which + # IMHO is wrong -- '?' and '*' aren't supposed to match slash in Unix, + # and by extension they shouldn't match such "special characters" under + # any OS. So change all non-escaped dots in the RE to match any + # character except the special characters. + # XXX currently the "special characters" are just slash -- i.e. this is + # Unix-only. + pattern_re = re.sub (r'(^|[^\\])\.', r'\1[^/]', pattern_re) + return pattern_re + +# glob_to_re () + + +def translate_pattern (pattern, anchor=1, prefix=None): + """Translate a shell-like wildcard pattern to a compiled regular + expression. Return the compiled regex.""" + + if pattern: + pattern_re = glob_to_re (pattern) + else: + pattern_re = '' + + if prefix is not None: + prefix_re = (glob_to_re (prefix))[0:-1] # ditch trailing $ + pattern_re = "^" + os.path.join (prefix_re, ".*" + pattern_re) + else: # no prefix -- respect anchor flag + if anchor: + pattern_re = "^" + pattern_re + + return re.compile (pattern_re) + +# translate_pattern () |