# googlecode_upload.py   [plain text]


#!/usr/bin/env python
#
# Copyright 2006, 2007 Google Inc. All Rights Reserved.
# Author: danderson@google.com (David Anderson)
#
# Modifications for distcc Copyright 2008 Google Inc.
# Author: Craig Silverstein.
#
# Script for uploading files to a Google Code project.
#
# This is intended to be both a useful script for people who want to
# streamline project uploads and a reference implementation for
# uploading files to Google Code projects.
#
# To upload a file to Google Code, you need to provide a path to the
# file on your local machine, a small summary of what the file is, a
# project name, and a valid account that is a member or owner of that
# project.  You can optionally provide a list of labels that apply to
# the file.  The file will be uploaded under the same name that it has
# in your local filesystem (that is, the "basename" or last path
# component).  Run the script with '--help' to get the exact syntax
# and available options.
#
# Note that the upload script requests that you enter your
# googlecode.com password.  This is NOT your Gmail account password!
# This is the password you use on googlecode.com for committing to
# Subversion and uploading files.  You can find your password by going
# to http://code.google.com/hosting/settings when logged in with your
# Gmail account. If you have already committed to your project's
# Subversion repository, the script will automatically retrieve your
# credentials from there (unless disabled, see the output of '--help'
# for details).
#
# If you are looking at this script as a reference for implementing
# your own Google Code file uploader, then you should take a look at
# the upload() function, which is the meat of the uploader.  You
# basically need to build a multipart/form-data POST request with the
# right fields and send it to https://PROJECT.googlecode.com/files .
# Authenticate the request using HTTP Basic authentication, as is
# shown below.
#
# Licensed under the terms of the Apache Software License 2.0:
#  http://www.apache.org/licenses/LICENSE-2.0
#
# Questions, comments, feature requests and patches are most welcome.
# Please direct all of these to the Google Code users group:
#  http://groups.google.com/group/google-code-hosting

"""Google Code file uploader script.
"""

__author__ = 'danderson@google.com (David Anderson)'

import httplib
import os.path
import optparse
import getpass
import base64
import sys
import re


def extract_version(project, file_paths):
  """Derive the release version from the names of the files to upload.

  Looks for the first file whose basename starts with
  <project>-<version>.<extension>, where <extension> is one of .tar.gz,
  .tgz, .tar.bz2 or .zip, and <version> begins with <digits>.<digits>.
  The project name is matched literally and case-insensitively.  The
  version found this way is then verified by checking that it occurs as a
  substring of every given path.

  Args:
    project: The project name, e.g. 'distcc'.
    file_paths: A sequence of paths of the files that will be uploaded.

  Returns:
    The version string, or the empty string if it could not be determined.
  """
  # Escape the project name so that regex metacharacters in it (the '.' in
  # 'a.b', the '+' in 'c++') are matched literally instead of being
  # interpreted as part of the pattern.
  archive_re = re.compile(
      r'%s-([0-9]+\.[0-9]+.*)\.(tar\.gz|tgz|tar\.bz2|zip)' % re.escape(project),
      re.I)

  for file_path in file_paths:
    m = archive_re.match(os.path.basename(file_path))
    if m:
      version = m.group(1)
      break
  else:    # for ended without finding anything
    return ''

  # Now verify the version shows up in every file we were given.
  for file_path in file_paths:
    if version not in file_path:
      return ''

  return version

def derive_summary_and_labels(file_path, package, version):
  """Derive an upload summary and labels from a distcc release file name.

  The human-readable project description is chosen from the file name:
  names containing 'distcc-server' describe the server, other names
  containing 'distcc' describe the client, except that '.tar' archives
  are source distributions holding both.  The kind of file is chosen
  from the file extension.

  Given a filename like distcc-server-3.0-1.i386.rpm and version '3.0',
  this function would derive
  * summary = "RPM for Distcc server (distccd) 3.0"
  * labels = ("Type-Package", "OpSys-Linux")

  Args:
    file_path: Path (or bare name) of the file to describe.
    package: Unused; kept so existing callers keep working.
    version: Version string to put into the summary.

  Returns:
    A (summary, labels) pair, where labels is a tuple of label strings.

  Raises:
    ValueError: if the file name does not mention distcc, or if the file
      extension is not one of the known kinds.
  """
  if 'distcc-server' in file_path:
    project = 'Distcc server (distccd)'
  elif 'distcc' in file_path:
    if '.tar' in file_path:
      # The source distribution has both client and server
      project = 'Distcc (both client and server)'
    else:
      project = 'Distcc client (distcc)'
  else:
    raise ValueError("Unknown project name for '%s'" % file_path)

  if file_path.endswith(('.tar.gz', '.tgz', '.tar.bz2')):
    return ('Tarball for %s %s' % (project, version),
            ('Type-Source', 'OpSys-All'))

  if file_path.endswith('.zip'):
    return ('Zip file for %s %s' % (project, version),
            ('Type-Source', 'OpSys-Windows'))

  if file_path.endswith('.deb'):
    if '-dev_' in file_path:
      return ('Development deb for %s %s' % (project, version),
              ('Type-Package', 'OpSys-Linux'))
    return ('Deb for %s %s' % (project, version),
            ('Type-Package', 'OpSys-Linux'))

  # Source RPMs must be recognized before the generic '.rpm' checks below.
  # Any '.src.rpm' is a source RPM, whether or not its name happens to
  # contain '-devel-'.
  if file_path.endswith('.src.rpm'):
    return ('Source-code RPM for %s %s' % (project, version),
            ('Type-Package', 'OpSys-Linux'))

  if file_path.endswith('.rpm'):
    if '-devel-' in file_path:
      return ('Development RPM for %s %s' % (project, version),
              ('Type-Package', 'OpSys-Linux'))
    return ('RPM for %s %s' % (project, version),
            ('Type-Package', 'OpSys-Linux'))

  raise ValueError("Unknown file extension for '%s'" % file_path)

def get_svn_config_dir():
  """Locate the Subversion configuration directory of the current user.

  When the win32com shell extensions can be imported, the directory is
  'Subversion' under the user's application-data folder; otherwise it is
  '.subversion' under the user's home directory.
  """
  try:
    from win32com.shell import shell, shellcon
  except ImportError:
    # No win32api available: fall back to ~, which is correct on unix and
    # gives not entirely unreasonable results on Windows.
    return os.path.expanduser('~/.subversion')

  # Windows with win32api: Subversion keeps its settings under APPDATA.
  appdata = shell.SHGetFolderPath(0, shellcon.CSIDL_APPDATA, 0, 0)
  return os.path.join(appdata.encode('utf-8'), 'Subversion')


def get_svn_auth(project_name, config_dir):
  """Look up cached Subversion credentials for a Google Code project.

  Args:
    project_name: The Google Code project whose repository realm to look up.
    config_dir: The Subversion configuration directory to read from.

  Returns:
    A (username, password) pair, or (None, None) when the Subversion
    Python bindings are unavailable, the lookup fails, or no complete
    entry is stored for the project.
  """
  nothing = (None, None)

  try:
    from svn.core import SVN_AUTH_CRED_SIMPLE, svn_config_read_auth_data
    from svn.core import SubversionException
  except ImportError:
    return nothing

  realm = ('<https://%s.googlecode.com:443> Google Code Subversion Repository'
           % project_name)

  try:
    credentials = svn_config_read_auth_data(SVN_AUTH_CRED_SIMPLE, realm,
                                            config_dir)
  except SubversionException:
    return nothing

  # The lookup can come back empty without raising, e.g. when config_dir
  # does not exist or holds no entry for this realm.
  if credentials is None:
    return nothing

  try:
    return (credentials['username'], credentials['password'])
  except KeyError:
    # An entry lacking either key is treated as no entry at all.
    return nothing


def upload(file, project_name, user_name, password, summary, labels=None):
  """Upload a file to a Google Code project's file server.

  Builds a multipart/form-data POST request from the summary, the labels
  and the file content, and sends it to https://PROJECT.googlecode.com/files
  using HTTP Basic authentication.

  Args:
    file: The local path to the file.
    project_name: The name of your project on Google Code.
    user_name: Your Google account name.
    password: The googlecode.com password for your account.
              Note that this is NOT your global Google Account password!
    summary: A small description for the file.
    labels: an optional list of label strings with which to tag the file.

  Returns: a tuple:
    http_status: 201 if the upload succeeded, something else if an
                 error occurred.
    http_reason: The human-readable string associated with http_status
    file_url: If the upload succeeded, the URL of the file on Google
              Code, None otherwise.
  """
  # The login is the user part of user@gmail.com. If the login provided
  # is in the full user@domain form, strip it down.
  if '@' in user_name:
    user_name = user_name[:user_name.index('@')]

  form_fields = [('summary', summary)]
  if labels is not None:
    form_fields.extend([('label', l.strip()) for l in labels])

  content_type, body = encode_upload_request(form_fields, file)

  upload_host = '%s.googlecode.com' % project_name
  upload_uri = '/files'
  auth_token = base64.b64encode('%s:%s'% (user_name, password))
  headers = {
    'Authorization': 'Basic %s' % auth_token,
    'User-Agent': 'Googlecode.com uploader v0.9.4',
    'Content-Type': content_type,
    }

  server = httplib.HTTPSConnection(upload_host)
  try:
    server.request('POST', upload_uri, body, headers)
    resp = server.getresponse()
    status, reason = resp.status, resp.reason
    # The Location header is only meaningful for a "201 Created" answer.
    if status == 201:
      location = resp.getheader('Location', None)
    else:
      location = None
  finally:
    # Close the connection even when sending the request or reading the
    # response fails, so the socket is never leaked.
    server.close()

  return status, reason, location


def _as_bytes(part):
  """Return part as a byte string, encoding text as UTF-8."""
  # On Python 2 a plain str already is a byte string and is returned
  # untouched; only unicode objects (and Python 3 str) get encoded.
  if isinstance(part, bytes):
    return part
  return part.encode('utf-8')


def encode_upload_request(fields, file_path):
  """Encode the given fields and file into a multipart form body.

  fields is a sequence of (name, value) pairs. file_path is the path of
  the file to upload. The file will be uploaded to Google Code with
  the same file name.

  The body is assembled as a byte string: text parts are UTF-8 encoded
  before being joined with the raw file content, so text is never
  implicitly mixed with arbitrary binary data.

  Returns: (content_type, body) ready for httplib.HTTP instance
  """
  BOUNDARY = '----------Googlecode_boundary_reindeer_flotilla'
  CRLF = '\r\n'

  body = []

  # Add the metadata about the upload first
  for key, value in fields:
    body.extend(
      ['--' + BOUNDARY,
       'Content-Disposition: form-data; name="%s"' % key,
       '',
       value,
       ])

  # Now add the file itself
  file_name = os.path.basename(file_path)
  f = open(file_path, 'rb')
  try:
    file_content = f.read()
  finally:
    # Release the handle even if reading fails.
    f.close()

  body.extend(
    ['--' + BOUNDARY,
     'Content-Disposition: form-data; name="filename"; filename="%s"'
     % file_name,
     # The upload server determines the mime-type, no need to set it.
     'Content-Type: application/octet-stream',
     '',
     file_content,
     ])

  # Finalize the form body
  body.extend(['--' + BOUNDARY + '--', ''])

  encoded_body = _as_bytes(CRLF).join([_as_bytes(part) for part in body])
  return 'multipart/form-data; boundary=%s' % BOUNDARY, encoded_body


def upload_find_auth(file_path, project_name, summary, labels=None,
                     config_dir=None, user_name=None, tries=3):
  """Find credentials and upload a file to a Google Code project's file server.

  file_path, project_name, summary, and labels are passed as-is to upload.

  If config_dir is None, try get_svn_config_dir(); if it is 'none', skip
  trying the Subversion configuration entirely.  If user_name is not None, use
  it for the first attempt; prompt for subsequent attempts.

  Args:
    file_path: The local path to the file.
    project_name: The name of your project on Google Code.
    summary: A small description for the file.
    labels: an optional list of label strings with which to tag the file.
    config_dir: Path to Subversion configuration directory, 'none', or None.
    user_name: Your Google account name.
    tries: How many attempts to make.

  Returns:
    The (status, reason, url) tuple of the last upload attempt, as returned
    by upload.  If tries is not positive no attempt is made and
    (None, None, None) is returned.
  """

  if config_dir != 'none':
    # Try to load username/password from svn config for first try.
    if config_dir is None:
      config_dir = get_svn_config_dir()
    (svn_username, password) = get_svn_auth(project_name, config_dir)
    if user_name is None:
      # If username was not supplied by caller, use svn config.
      user_name = svn_username
  else:
    # Just initialize password for the first try.
    password = None

  # Defined up front so that the final return is valid even when the loop
  # below never runs (tries <= 0).
  status = reason = url = None

  while tries > 0:
    if user_name is None:
      # Read username if not specified or loaded from svn config, or on
      # subsequent tries.
      sys.stdout.write('Please enter your googlecode.com username: ')
      sys.stdout.flush()
      user_name = sys.stdin.readline().rstrip()
    if password is None:
      # Read password if not loaded from svn config, or on subsequent tries.
      # Written with sys.stdout.write like the username prompt above.
      sys.stdout.write(
          'Please enter your googlecode.com password.\n'
          '** Note that this is NOT your Gmail account password! **\n'
          'It is the password you use to access Subversion repositories.\n')
      prompt = 'Password (listed at http://code.google.com/hosting/settings): '
      password = getpass.getpass(prompt)

    status, reason, url = upload(file_path, project_name, user_name, password,
                                 summary, labels)
    # Returns 403 Forbidden instead of 401 Unauthorized for bad
    # credentials as of 2007-07-17.
    if status in [httplib.FORBIDDEN, httplib.UNAUTHORIZED]:
      # Reset for another try.
      user_name = password = None
      tries = tries - 1
    else:
      # We're done.
      break

  return status, reason, url


def main():
  parser = optparse.OptionParser(usage='googlecode-upload.py -s SUMMARY '
                                 '-p PROJECT [options] FILE [FILE] ...')
  parser.add_option('--config-dir', dest='config_dir', metavar='DIR',
                    help='read svn auth data from DIR'
                         ' ("none" means not to use svn auth data)')
  parser.add_option('-s', '--summary', dest='summary',
                    help='Short description of the file'
                         ' (if not set, description will derive from filename)')
  parser.add_option('-u', '--user', dest='user',
                    help='Your Google Code username'
                         ' (if not set, the program will prompt you)')
  parser.add_option('-l', '--labels', dest='labels',
                    help='An optional list of labels to attach to the file'
                         ' (if not set, labels will derive from filename)')

  options, args = parser.parse_args()

  if not args:
    parser.error('File(s) to upload not provided.')

  project = 'distcc'   # We hard-code that. :-)

  if options.labels:
    user_labels = options.labels.split(',')
  else:
    user_labels = None

  default_user = os.environ.get('USER', 'unknown')
  if options.user:
    user = options.user
  else:
    print 'Enter username (<enter> takes the default of "%s"):' % default_user,
    user = raw_input() or default_user

  prompt = 'Password (listed at http://code.google.com/hosting/settings): '
  password = getpass.getpass(prompt)

  version = extract_version(project, args)

  successes = 0
  failures = 0

  for file_path in args:
    # If the user did not specify the summary or labels, derive these
    # from the filename.
    try:
      (derived_summary, derived_labels) = \
          derive_summary_and_labels(file_path, project, version)
    except ValueError, why:
      print "%s" % why
      failures += 1
      continue

    summary = options.summary or derived_summary
    labels = user_labels or derived_labels

    # The find_auth functionality is currently broken; see
    # http://code.google.com/p/support/issues/detail?id=558
    # This is why we asked for the password/username above.
    ## status, reason, url = upload_find_auth(file_path, options.project,
    ##                                        options.summary, labels,
    ##                                        options.config_dir, options.user)
    status, reason, url = upload(file_path, project, user, password,
                                 summary, labels)

    if url:
      print '%s was uploaded successfully.' % file_path
      print 'URL: %s' % url
      print
      successes += 1
    else:
      print 'An error occurred. %s was not uploaded.' % file_path
      print 'Google Code upload server said: %s (%s)' % (reason, status)
      print
      failures += 1

  print "Upload status: %d successes, %d failures." % (successes, failures)
  return failures


if __name__ == '__main__':
  # main() returns the number of failed uploads.  Exit statuses are
  # truncated to 8 bits on POSIX systems, so clamp the count: otherwise
  # exactly 256 failures would be reported as exit status 0 (success).
  sys.exit(min(main(), 255))